// Computer Program Listing Appendix Under 37 CFR 1 .52(e) 
// cache. hpp 

// Copyright (c) 2004. Sybase, Inc. All Rights Reserved. 

II ******************************************************************* 

// Copyright 1991-2003 iAnywhere Solutions, Inc. All rights reserved. 

II ******************************************************************* 

#jfndef CACHE_HPP 
#define CACHE_HPP 
class Cache; 
class CacheChain { 
public: 

CacheChainQ 
:_head(NULL) 
, _refs( NULL ) 
{ 
} 

void Latch! nfos() { 
_latch.get( _contention_counter( HASH_CONTENTION ) ); 
} 

void UnlatchlnfosO { 
Jatch.giveO; 
} 

void LatchO { 

_mutex.get( _contention_counter( HASH_CONTENTION ) ); 
} 

void UnlatchO { 
_mutex.give(); 
} 

class Pagelnfo *Find( a_cache_name name ); 
class Pagelnfo *AssuredFind( a_cache_name name ); 
class Pagelnfo *FindOrlnsert( a_cache_name name, Pagelnfo * insert ); 
void Remove( Pagelnfo * remove ); 
// Operations on cache refs 
void Add( class CacheRef * ref ); 
a_bool Remove( class CacheRef * remove ); 
private: 
friend class Cache; 
friend class CacheRef; 
Mutex Jatch; 
Mutex _mutex; 
class Pagelnfo *_head; 
class CacheRef *_refs; 

}; 

typedef unsigned a_queue_time; 

typedef a_byte a_prs_slot; 

#define PRS_TOTAL_SLOTS 128 

class DBSRVAPI Pagelnfo : public Cachelnfo { 

public: 

Pagelnfo( void * image ); 

--PagelnfoO; 



void PrepareForAclcl( a_cache_name name, unsigned now ); 

a_bool ScrubO; 

void PrepareForRead( class lOCB * iocb ); 

Pagelnfo * Reset( a_cache_name name, unsigned now ); 

inline a_bool reapable_address_space() const; // and physical frame (addr is always mapped to something) 
inline a_bool reapable_physical_frame( class Cache *cm ) const; 
inline a_bool decommitable_image() const; 
a_bool do_read_to_write_lock( Worker *me ); 
void do_write_to_read_lock( Worker *me ); 
void writeJockO; 
void add( class CacheRef *ref ); 
void remove( class CacheRef *ref ); 
void wait_for_lock( CacheChain *chain ); 
a_bool is_dirty() const { 
return( Js.dirty ); 
} 

void mark_dirty() { 
if( !is_dirty() ) { 
_file->mark_dirty( this ); 

} 

} 

void do_write( Pagelnfo *delay ); 
void writeO; 

void start_write( Pagelnfo *delay = NULL ); 

void write_and_flush(); 

void read(); 

void w_complete(); 

void r_complete(); 

void remove_delay(); 

void prep_for_read( Database *db ); 

void map(); 

void enqueue( class Cache *cache ); 

inline void set_physmem_id( class Cache *cm, a_physmem_id physmemjd ); // only used in cachespt 

inline a_physmem_id get_physmem_id( class Cache *cm ) const; 

a_bool is_pending( void ); 
#if defined( AWE_CACHE ) 

inline void map_to_physmem( class Cache *cm, a_physmem_id physmem_id ); 
#endif 
private: 

Pagelnfo *_next; //on chain 

RWLatch Jatch; 

union a_name_reuse_state { 
struct { 

uint16 ref_count; 

uint16 is_in_hash; 
} bits; 

uint32 as_cell; 

} _state; 

union { 
a_byte _flags; 



struct { 

a_byte dirty : 1 ; 

a_byte preimage_may_not_be_committecl : 1 ; 
a_byte blob_page : 1 ; 
a_byte tracked_tablej3age : 1 ; 
a_byte coldstart_recorded : 1 ; 
} Js; 

}; 

uint16 _tid; 
unsigned _visited_at; 
a_prs_slot _score; 

union { // only meaningful when _is.preimage_may_not_be_committed == TRUE 
a_physical_page _checkpoint_log_pos; 
a_page_id _rollback_page_no; 

}; 

a_page_id _real_page_no; // != page_no if mapped 
class lOCB * _pending; 

enum { // Overloaded values for _pending. Must have low bit on. 
REUSABLE = 1 , 
JUSTJNSTALLED = 3, 
IMAGE_MISSING = 5, 
PINNED = 7 

}; 

#if IPRODUCTION 

a_debug_count firstjock; // for debugging 
a_debug_count first_write; // for debugging 
#endif 

#ifdef CHECKSUM 

unsigned checksum; 
#endif 

// Unprotected by Jatch. 

a_ptrint _queue_slot; 
public: 

a_bool read_to_write_lock(); 

void write_to_read_lock(); 

void unlockO; 
#if IPRODUCTION 

void verifyO; 
#endif 
public: 

a_bool HasName( a_cache_name name ) const { 
return( _name.as_uint == name.as_uint ); 
} 

a_bool IsReusableO const { 
return( J3ending == (lOCB *) REUSABLE ); 
} 

a_bool IsMissinglmageO const { 
return( j)ending == (lOCB *) IMAGE_MISSING ); 
} 

a_bool IsPinnedO const { 



return( jDending == (lOCB *) PINNED ); 
} 

a_bool IsDirtyO const { 
return( Js. dirty ); 
} 

a_bool IslnHashO const { 
return( _state.bits.is_in_hash ); 
} 

a_bool IsAddressableO const { 
return( Jmage != NULL ); 
} 

void MarklmageAsMissingQ { 
_pending = (lOCB *) IMAGE_MISSING; 
} 

void MarklmageAsAvailableO { 
jDending = NULL; 
} 

a_bool Latch( class Cache * cm, a_cache_name name, a_bool shared = FALSE ); 

void Latch( a_bool shared = FALSE ) { 
if( shared ) { 

_latch.get_shared(); 
} else { 

_latch.get_exclusive(); 

} 

} 

a_bool TryLatch( a_bool shared = FALSE ) { 
return( shared? _latch.try_get_shared() : _latch.try_get_exclusive() ); 
} 

void ExclusiveToSharedO { 
_latch.exclusive_to_shared(); 
} 

a_bool SharedToExclusiveO { 
return( _latch.shared_to_exclusive() ); 
} 

a_bool TrySharedToExclusiveO { 
return( _latch.try_shared_to_exclusive() ); 
} 

a_bool IsLatchedO const { 
return( _latch.havejatch() ); 

} 

a_bool IslnUseO const { 
return( IsLatchedQ || lsPinned() ); 
} 

#if IPRODUCTION 

a_bool HaveExclusivelyO const { 
return( _latch.have_exclusive_latch() ); 

} 

#endif 

void UnlatchQ { 
_latch.give(); 



} 

void UnlockO { 
UnlatchO; 
} 

void WaitForPendingO { 
if( _pending ) { 

DoWaitForPendingO; 

} 

} 

void WaitForPreimageO { 
if( _is.preimage_may_not_be_committed ) { 
Do WaitForPreimageO; 

} 

} 

void Shrink( Cache * cm ); 
a_bool IsShrinkableO; 
a_bool CanCommitO; 
void CommittedO; 
void Pin(); 
void Unpin(); 
void WriteAndEvictO; 
void EvictQ; 



private: 






friend 


class 


Cache; 


friend 


class 


PageQueue; 


friend 


class 


CacheChain; 


friend 


class 


CacheRef; 


friend 


class 


Cachelnfo; 


friend 


class 


Info Friend; 


friend 


class 


Database File; 


friend 


class 


CheckpointLog; 


friend 


class 


lOCB; 



void RecordHit( class Cache * cm ); 

a_bool CanPreventReuseO; 

a_bool AllowReuseO; 

a_bool SetlnHash( a_bool in_hash ); 

a_bool IsReapableO const; 

void CleanO; 

void FinishLock( a_bool shared ); 
void AssertNotFree( Database * db ); 
class lOCB * StartReadO; 
class lOCB * StartWrite( a_bool evict = FALSE ); 
void SetPrelmage( aj3age_id page_no ); 
void Write( a_bool wait = FALSE ); 
void DoWaitForPendingO; 
void DoWaitForPreimageO; 
a_bool JustlnstalledO const { 
return J3ending == (lOCB *) JUSTJNSTALLED; 
} 

a_bool IsColdstartRecordedO const { 



return _is.coldstart_recorclecl; 

} 

void SetColdstartRecorded( a_bool val ) { 
_is.coldstart_recorded = (a_byte) val; 

} 

}; 

//_pending codes: iocb pointer 

// 1 => reserved for local thread 

// 2 => address space missing 

// 3 => need data 

// 4 => free 

// 5 => reusable 

// 6 => allocated for image 

// A page_ref is in some chain iff page_no is not NULL_PAGE. 

// The page pointed to by a page_ref is locked iff page is not NULL. 

#define SUPJNDEX 65535 

class DBSRVAPI CacheRef : public HeapObject { 

public: 

CacheRefO 
: _chain( NULL ), _info( NULL ), _flags( 0 ) 

{ 

_name.as_member.page_no = NULL_PAGE; 
} 

CacheRef( a_database_number db_no, a_page_id page_no ); 
CacheRef( a_database_number db_no, a_record_id const &id ); 
CacheRef( Pagelnfo *info ) { 
force( info ); 
} 

--CacheRefO { 
releaseRefsO; 
} 

CacheRef ( CacheRef const &ref ); 

CacheRef & operator= ( CacheRef const &ref ); 

void Set( a_database_number db_no, a_record_id const &id ); 

void Add( a_cache_name name, a_page_count index = 0 ); 

void RemoveO; 

void Latch( a_bool shared = FALSE ); 

void Latch( a_cache_name name, a_bool shared ); 

void Lock( a_bool shared = FALSE ) { 
Latch( shared ); 
mark_dirty( shared ); 

} 

void Lock( a_cache_name name, a_bool shared = FALSE ) { 

Latch( name, shared ); 
mark_dirty( shared ); 
} 

void UnlockO; 

CacheChain *LatchChain() const; 

void force( Pagelnfo *info ); 

void force( Pagelnfo *info, a_page_count index ); 



void finishO { 

releaseRefsO; 
_is.cleleted_at = FALSE; 
_is.inserted_at = FALSE; 
} 

a_bool is_deleted() const { 
return( _is.deleted_at ); 
} 

a_bool is_on_page() const { 
return( _name.as_member.page_no != NULL_PAGE ); 
} 

void *page() const { 
return( _info? _info->_image : NULL ); 
} 

Pagelnfo *info() const { 
return( Jnfo ); 
} 

a_page_id page_no() const { 
return( _name.as_member.page_no ); 
} 

a_page_count indexQ const { 
return( Jndex ); 
} 

a_bool validO const { 
return( !_is.page_deleted ); 
} 

a_bool lookupJnvalidO const { 
return( _is.deleted_at || _is.inserted_at ); 
} 

void read_lock_page() { 
Lock( TRUE ); 

} 

void read_lock_page( a_database_number db_no, aj3age_id page_no ) { 
Lock( NameFor( db_no, page_no ), TRUE ); 
} 

void read_lock_coupie( a_page_id page_no ) { 
lock_couple( page_no, TRUE ); 
} 

void write_lockj3age() { 
LockO; 
} 

void write_lock_page( a_database_number db_no, aj3age_id page_no ) { 
Lock( NameFor( db_no, page_no ) ); 
} 

void writeJock_couple( ajDageJd page_no ) { 
lock_couple( page_no, FALSE ); 
} 

void unlock_page(); 

a_bool move_to( a_page_id page_no, a_page_count index ); 
void lock( a_bool shared ) { 



Latch( shared ); 
mark_dirty( shared ); 
} 

void lock_couple( a_page_id page_no, a_bool shared ); 

Page Info *transfer_lock() { 
// FIXME: This is a hack that should be done away with. 
_assertD( Js. locked ); 
Js. locked = FALSE; 
return( _info->_image ? _info : NULL ); 

} 

a_bool return_lock( Cachelnfo * info ) { 
_assertD( Ms. locked && info != NULL ); 
if( (Pagelnfo *) info == Jnfo ) { 

Js. locked = TRUE; 

return( TRUE ); 

} 

return( FALSE ); 
} 

void releaseRefsO; 
void lock_clean( a_bool shared ) { 
Latch( shared ); 
} 

void mark_dirty( a_bool shared = FALSE ) { 
if( Ishared && Jnfo != NULL ) { 
Jnfo->mark_dirty(); 

} 

} 

void writeJock_cleanj3age() { 
LatchO; 

} 

void unlockO { 
Js.locked = FALSE; 
Jnfo->Unlock(); 

} 

protected: 

friend class Cache; 

void remove JromJocked_page(); 

void clone( CacheRef const &ref ); 

void latchO const; 
public: 

CacheRef *_next; 

CacheChain *_chain; 

Pagelnfo *Jnfo; 

a_cache_name _name; 
public: 

a_page_count Jndex; 

union { 
struct { 

uint1 6 where : 8; // Where could we be in the scan? 
// LESS => value is less than left fencepost 



// EQUAL => value is between fenceposts 

// GREATER => value is greater than right fencepost 

//NB: 

// 1) Missing fenceposts essentially treated as infinite. 
// 2) After a comparison, only set according to value. 
uint16 pinned_to_page : 1; 
uint16 page_deleted : 1; 
uint16 reversed : 1; 
uint16 via_bitmap : 1; 
uint1 6 deleted_at : 1 ; 
uint16 inserted_at : 1; 
uint16 locked : 1; 
} _is; 

uint16 _flags; 

}; 

protected: 

void latch_and_do_add_to_page( a_database_number db_no, a_page_id page_no ); 

}; 

class DBSRVAPI lOCB : public DeferredIO { 
public: 

lOCBO 
: _info( NULL ) 

{ 

} 

void LatchO { 
_mutex.get(); 
} 

a_bool TryLatchO { 
return( _mutex.try_get() ); 
} 

void UnlatchO { 
_mutex.give(); 
} 

a_bool Finish( a_bool wait, a_bool respect_evict ); 
a_bool Finish( Pagelnfo * info, a_bool wait, a_bool respect_evict ); 
a_bool DoFinish( Pagelnfo * info, a_bool wait, a_bool respect_evict ); 
a_bool lsActuallyPending( void ); 
private: 

friend class DatabaseFile; 
friend class SysFile; 
friend class Cache; 
friend class Pagelnfo; 
Pagelnfo *Jnfo; 

an_ioreq_type _io_type; // PJB TODO: set counter type 
union { 
struct { 

uintS to_be_evicted; 

} _is; 

uintS _flags; 

}; 



uint32 _mask; 
Mutex _mutex; 
CondVar _finishecl; 

}; 

#enclif 

// cachespt.cpp 

// Copyright (c) 2004. Sybase, Inc. All Rights Reserved. 

II ******************************************************************* 

// Copyright 1997-2003 lAnywhere Solutions, Inc. All rights reserved. 

II ******************************************************************* 

// Mode: C++ -*- 

// 

// One stop shopping for memory. 

// 

// Contiguous array of infos point to exactly one image (that may or may 

// not be addressable). Address space is allocated immediately, and committed 

// as needed. 

// Age scores of pages as we check. Have rover that checks. 
// 

// Replace grab_frame with explicit copy (locking pages). 

// Use TryLock to reduce the number of times we need to give up a lock 

// in order to delete a page. 

// 

// Have 2 reusable arrays: with and without address space. Try for page 
// with address space first, then for page without and troll for address 

// space. 

// Need quarantine (even for blocking hash implementation). We can't reuse 
// an info while an attempt is being made to latch it (but we can remove it). 
// We put removed entries into a quarantine, and from there into the free 
// queues. We need per task hazard pointers. 

// 

// We should do a TryLatch operation first and only invoke the expensive 
// operations when contention is detected. 

// 

// We could mark page as being quarantined (not eligible for reuse) if we 
// need to block. Have bits to mark info as free/guarded. Mark as guarded 
// if we need to block for latch. 

// For old databases, keep page number of pre-image. When attempting to 

// to write a page with a pre-image, see if we can latch pre-image, and if 

// so wait for lO to finish (will disappear from cache when done). 

// Would like to wait for an iocb only if it belongs to a particular info 

// We need a count of references + indication that would like to change name 

// When count is 0 then we can change name; reset counter when we allocate 

// 

// ? Attempt to flush dirty page from cache -> start write, page marked 
// as going out, unlock page -> attempt to read page -> get shared access 
// and claim IOCB -> if we need page, do not evict. 

// 

// Resource orderings: 

// Pages must be latched before pending lOCBs 



// A page must be latched before its pre-image 
#inclucle "dbprecom.h" 
#if defined( _MSC_VER ) 
#pragma hdrstop 



#endif 




#include 


"cachespt.hpp" 


#include 


"cachedef.hpp" 


#include 


"rnthread.h" // for MAX_STACK_SIZE 


#include 


"rnsqipro.h" 


#include 


"vmem.hpp" 


#include 


"cachesize.hpp" 


#include 


"dosbox.h" 


#include 


"dbglobal.h" 


#include 


"ksynch.hpp" 


#include 


"dbstart.h" 


#include 


"dbmulti.h" 


#include 


"wcsupprt.hpp" 


#include 


"pagemap.h" 


#jnclude 


"pagectr.hpp" 


#include 


"rnconnec.h" 


#include 


"ichkptlog.hpp" 


#include 


"osintf.hpp" 


#include 


"dbstate.h" 


#include 


"dfsys.h" 


#include 


"dfcio.h" 


#include 


"dbyield.h" 


#include 


"pagegrp.hpp" 


#include 


"utiangstring.hpp" 


#jnclude 


"dbautockpt.hpp" 


#include 


"storeifs.hpp" 


#include 


"strids.h" 


#include 


"cache, hpp" 


#include 


"cachersv.hpp" 


#include 


"cachedyn.hpp" 


#include 


"cacheawe.hpp" 


#include 


"dbcoldstart.hpp" 


#include 


"dbtrace.hpp" 



// #undef AWE_CACHE 
// PJB FIXME: To be removed, 
inline p_Database LookupDBID( uint32 id ) { 
return( Eng->db.lookup( id ) ); 

} 

inline p_Database DBFromlD( uint32 id ) { 
return( LookupDBID( id ) ); 

} 

#define _grant_image_access() 
#def ine _revoke_image_access() 
#if defined( VM_PROTECT ) 

#define MIN_CACHE_PAGE_BITS 12 
#elif defined( POINTERS_ARE_64BITS ) 



// dec unix (which is a 64 bit platform) requires min of 2K page 
// this is due to some data structures which have exceeded the 1 K page 
// limit due to the doubling of pointers in the structures. 
#define MIN_CACHE_PAGE_BITS 11 
#else 

// all other platforms require at least 10 bits (1024 bytes) 
#define MIN_CACHE_PAGE_BITS 10 
#endif 

// #define MAX_IOCB 5 // make it small to test blocking logic 
#if defined( UNDER_CE ) 
#define MAX_IOCB 50 
#else 

#define MAXJOCB 255 
#endif 

#define ALL_FILES -1 

#define MAPPED_PAGES -2 

#if PRODUCTION < 1 

a_bool DisableAssertNotFree = FALSE; 

#endif 

class DBSRVAPI IdlelOTimer : public ATimer { 
public: 

IdlelOTimerO; 

void dispatchO; 
private: 

unsigned _rover; 

}; 

static Cache * XM = NULL; 
Cachelnterface * CM = NULL; 
// PJB FIXME: needs to be native, 
typedef atomic32 atomic_ptrint; 
class PageQueue { 
public: 

PageQueueO; 

void lnitialize( Pagelnfo **queue ); 
void Resize( Cache * cm, a_ptrint size ); 
void Enqueue( Pagelnfo * info ); 
Pagelnfo * DequeueQ; 
private: 

Pagelnfo ** _queue; 
a_ptrint _size; 
a_ptrint _threshold; 
atomic_ptrint _head; 
atomicj3trint_tail; 

}; 

class Cache : public Cachelnterface { 
public: 

Cache( p_engine_parms ep, AWEInterface * awe ); 

-CacheO; 

a_bool IsUpAndRunningO const { 
return( XM == this ); 



} 

an_image_set * get_images() { 
return( &_images ); 
} 

Pagelnfo * LockRaw( a_cache_name name, a_bool shared = FALSE ) { 
Pagelnfo * info = lnstall( name, shared ); 
info->FinishLock( shared ); 
return( info ); 

} 

Pagelnfo * Lock( a_cache_name name, a_bool shared = FALSE ); 
unsigned Hint( a_cache_name name ); 
void *Alloclmage( Cachelnfo ** pinfo ); 
void Freelmage( Cachelnfo * info ); 

void *multi_page_alloc( uint32 num_pages, uint32 page_size, MultiPageAlloc *handle ); 
void multi_page_free( MultiPageAlloc *handle ); 

void Evict( a_cache_name name ); 

void FlushDBFromCache( a_database_number db_no, a_bool is_scrammed ) { 
Evict( db_no, ALL_FILES, is_scrammed ); 
} 

void FlushMappedPages( a_database_number db_no ) { 
Evict( db_no, MAPPED_PAGES, TRUE ); 
} 

void FlushCacheForFileDrop( a_database_number db_no, unsigned file_no ); 

void sa_flush_cache( p_database db ); 

void Flush( p_database db ); 

a_ptrint likely_available(); 

a_ptrint ^virtual CacheMax() { 

// Outside of the cache manager, "CacheMax" is used as an 
// indication of the number of pages in the cache; however, 
//with dynamic cache sizing, _config._current.cache_max() 
// indicates the number of *frames* which could be larger 
// than the number of committed images if there are holes in 
// the image address space 
return( _config._current._n_committed_images ); 

} 

#if IPRODUCTION 

void CheckForLockedPages( int db_no ); 
#endif 

void adjust( DoAdjust *cb. Database *db, a_page_id pO, a_page_id p1, a_page_id p2 ); 
a_bool WaitAnyO; 

void WaitAII( a_database_number db_no ); 
void WaitForExtend( Pagelnfo * extend ); 
void WaitUntilClean( IDatabaseFile * file ); 
lOCB * GetlOCB( Pagelnfo * info ); 
void PrelOO; 
void PostlOO; 
void Add( CacheRef * ref ); 
// Depricated wrappers. 

void evict( Database *db, a_page_id page_no ) { 
Evict( NameFor( db->id(), page_no ) ); 



} 

unsigned hint( Database * db, a_page_id page_no ) { 
return( Hint( NameFor( db->id(), page_no ) ) ); 
} 

unsigned hint( a_page_id page_no ) { 
return( hint( _CurrentDB, page_no ) ); 
} 

// NB Don't need DIO_Wait_AII before call to this, 
void flush_db_from_cache( p_database db, a_bool is_scrammed ) { 
FlushDBFromCache( db->id(), is_scrammed ); 
} 

void flush_mapped_pages( p_database db ) { 
FlushMappedPages( db->id() ); 
} 

void flush_cache_for_table_drop( p_database db, unsigned file_no ) { 
FlushCacheForFileDrop( db->id(), file_no ); 
} 

void flush( p_database db ) { 
Flush( db ); 
} 

a_ptrint ^virtual cache_max() 

{ 

return( ^virtual CacheMax() ); 

} 

#if IPRODUCTION 

void check_if_still_used_at_commit( p_database db, Cachelnfo *def_page ) { 
ChecklfStillUsedAtCommit( db->id(), def_page ); 
} 

void check_for_locked J3ages( int db_no ) { 
CheckForLockedPages( db_no ); 
} 

#endif 

void hint_page_group( PageGroup *pagegrp, aj3age_id start, uint32 pages_wanted ); 
void cache_message( void ); 
void engine_startup_complete(); 
a_ptrint cache_available_images(); 
a_ptrint cache_available_addr(); 

a_bool enoughj3ages_available( uint32 numj3ages, a_bool grow_cache_if_necessary ); 
void kick_auto_resize(); 
DynamicCacheConfig * min_config() { 
return( &_config._minimum ); 
} 

DynamicCacheConfig * max_config() { 
return( &_config._maximum ); 
} 

DynamicCacheConfig * current_config() { 
return( &_config._current ); 
} 

DynamicCacheConfig * initial_config() { 
return( &_config._initial ); 



} 

a_bool resize_cache( uint64 newsize ); 
#if clefinecl(DYNAMIC_CACHE_SIZE) 

a_bool suspend_resizing(); 

a_bool resume_resizing(); 

a_bool resizing_suspencled() const; 
#enclif 

uint64 current_cache_size() { 
return( _config._current.cache_size() ); 
} 

uint64 minimum_cache_size() { 
return( _config._minimum.cache_size() ); 
} 

uint64 maximum_cache_size() { 
return( _config._maximum.cache_size() ); 
} 

Cachelnfo *read_lock( p_database db, a_page_id page_no ) { 
return( Lock( NameFor( db->id(), page_no ), TRUE ) ); 
} 

Cachelnfo *write_lock( p_database db, a_pagejd page_no ) { 
Pagelnfo * info = Lock( NameFor( db->id(), page_no ) ); 
info->mark_dirty(); 
return( info ); 

} 

Cachelnfo *writeJock_clean( p_database db, a_page_id page_no ) { 
return( Lock( NameFor( db->id(), page_no ) ) ); 
} 

Cachelnfo *write_lock_raw( p_database db, a_page_id page_no ) { 
return( LockRaw( NameFor( db->id(), page_no ) ) ); 
} 

a_pthnt Clean( Database *db, unsigned rover, unsigned count ); 
private: 

friend class lOCB; 

friend class CacheRef; 

friend class PageQueue; 

a_pthnt ordinal( Pagelnfo * info ) { 
return( info -Jnfo ); 

} 

a_byte * ordinal_to_image( a_ptrint ordinal ) { 
return( _images.ordinal_to_image( ordinal ) ); 
} 

CacheChain *ChainFor( a_cache_name name ) { 
return( &_page_hash[name.as_member.page_no%_hash_max] ); 
} 

// Basic cache operations. 

Pagelnfo * AddToHash( CacheChain * chain, a_cache_name name, Pagelnfo * alloc ); 

Pagelnfo * Alloc(); 

void Free( Pagelnfo * info ); 

void AddToReusable( Pagelnfo * info ); 

Pagelnfo * AllocReusable(); 



Pagelnfo * lnstall( a_cache_name name, a_bool shared = FALSE ); 

Cachelnfo * lnstall( a_clatabase_file * f, a_page_icl page_no, a_page_id real_page_no ); 

Pagelnfo * lsNotlnCache( a_cache_name name ); 

Pagelnfo * lslnCache( a_cache_name name ); 

Pagelnfo * LatchlflnCache( a_cache_name name ); 

a_bool lslmmediatelyLatchable( a_cache_name name ); 

a_bool lslOPending( a_cache_name name ); 

Pagelnfo * Scavenge(); 

a_bool CanScavenge( Pagelnfo * info, class ScavengeState * state ); 
Pagelnfo * Panic(); 
#if defined( AWE_CACHE ) 

#define TAG_UNMAPPED(x) ((void*)(((a_ptrint)(x))|1)) 
#define STRIP_TAG(x) ((a_byte*)(((a_ptrint)(x))&~1)) 
#define IS_UNMAPPED(x) ((((a_ptrint)(x))&1) != 0) 

void MakeAddressable( Pagelnfo * info ) { 
if( !info->lsAddressable() || IS_UNMAPPED( info->_image ) ) { 
DoMakeAddressable( info ); 

} 

} 

void DoMakeAddressable( Pagelnfo * info ); 
#else 

void MakeAddressable( Pagelnfo * info ) { 
_unused( info ); 
} 

#endif 

a_bool RemoveFromHash( Pagelnfo * info ); 

void Evict( a_database_number db_no, unsigned file_no, a_bool is_scrammed ); 
void FlushPages( Database *db, struct a_flushed *flushed, unsigned n ); 
void DoFlush( p_database db, a_bool flush_temp ); 
#if IPRODUCTION 

void CacheError( Pagelnfo *info, a_cache_error error ); 

void ChecklfStillUsedAtFileDrop( a_database_number db_no, unsigned file_no ); 

void ChecklfStillUsedAtCommit( a_database_number db_no, Cachelnfo *def_page ); 
#endif 
private: 

class lOGIobals { 

public: 
lOGIobalsO; 

private: 
friend class Cache; 
lOCB iocb[MAX_IOCB]; 
unsigned rover; 
IdlelOTimer idle_timer; 

} Jo; 
private: 

friend class Pagelnfo; 

a_ptrint avail_infos() const { 
return( _config._current._n_infos ); 

} 

// Page access. 



Pagelnfo * Jnfo; // Contiguous array of all infos. 

unsigned _rover; // cycles through infos 
PageQueue _reusable; // a reusable info 
atomic_ptrint _pinned_images; 
// Page naming. 

CacheChain * _page_hash; // Where the pages live. 

unsigned _hash_max; // Number of chains. 

// Page scoring. 
#define SEGMENTS_IN_CACHE 32 
#define MAX_SCORE SEGMENTSJN_CACHE 
#define MAX_THRESHOLD (SEGMENTSJN_CACHE/2) 

unsigned _now; // Current "time". 

unsigned _delta; // Window size (increment score). 

unsigned Jncr; 

void SetPageScoringParametersO { 
_delta = cache_available_images()/SEGMENTS_IN_CACHE; 
if( _delta == 0 ) _delta = 1 ; 
Jncr = sqrt((double)_delta); 

} 

private: 

void assert_page_no( Database *db, a_page_id page_no, void *page ) { 
// This check is hard-wired for performance reasons 
if( *(uint32 *)page != page_no ) { 
dump_page( db, page, page_no ); 
_assertP( 101412, FALSE, 
"Page number on page does not match page requested" ); 

} 

} 

an_image_set Jmages; 
#if defined( AWE_CACHE ) 
private: 

AWECache _awe_cache; 

Pagelnfo ** _frame_owner; 

a_ptrint _frame_rover; 
#endif 

a_bool awe_enabled() { 

// The code is cleaner in some places if this function is defined 
// on non-awe platforms as well. 

#if defined( AWE_CACHE ) 
return( _awe_cache.enabled() ); 
#else 

return( FALSE ); 
#endif 

} 

CacheAllocator _allocator; 
void recompute_headroom() { 
#if defined(DYNAMIC_CACHE_SIZE) 

_headroom = _auto_resize? _config._maximum._n_committed_images - 

_config._current._n_committed_images : 0; 
#else 



_heaclroom = 0; 
#enclif 
} 

a_ptrint _heaclroom; 
private: 

a_bool Growlnfos( a_ptrint to_commit ); 

a_ptrint Commitlmages( a_ptrint lo, a_ptrint to_commit ); 

a_bool recommit( void *p, a_ptrint olcl_count, a J3trint new_count, a_ptrint item_size ); 
#if definecl(DYNAMIC_CACHE_SIZE) 
private: 

void after_cache_size_change(); 

a_ptrint Growlmages( a_ptrint to_commit ); 

a_bool grow( a_ptrint to_commit ); 

a_bool grow_cache( DynamicCacheConfig &config ); 

a_bool grow_cache_by_images( a_ptrint numjmages ); 
#if IPRODUCTION 

void debug_images(); 
#else 

void debugJmagesO {} 
#endif 

#if defined( ALLOW_CACHE_TO_SHRINK ) 

a_bool lsShrinkable( Pagelnfo * info ); 
#endif 

void shrink_images( a_ptrint to_decommit ); 
a_ptrint FindRange( a_ptrint hi, a_bool is_shrinkable ); 
a_ptrint Decommit( a_ptrint lo, a_ptrint hi, a_ptrint max ); 
a_bool shrink_cache( DynamicCacheConfig &config ); 
private: 

Mutex _cache_growth_mutex; 

CacheAutoResizeTimer *_auto_resize; 
#endif 

CacheBounds _config; 
#if defined( LINUX) 

a_bool _touch_page_before_use; 
#endif 

}; 

static inline void 

SuicideOnFatalErrorO 

^******************* I 

{ 

if( DB_Fatal_error != SQLSTATE_NOERROR ) { 
_CurrentWorker->suicide( -1 ); 
} 

} 

Cachelnterface::Cachelnterface( p_engine_parms ep ) 

I************************************************* I 

: _db_page_bits_max ( ep->page_bits ) 

, _db_page_size_max ( 1 «_db_page_bits_max ) 

, _db_page_mask_max ( - (a_ptrint)_db_page_size_max ) 

> _os_page_size ( OS_PageSize() ) 



, _os_page_bits ( log2( _osj3age_size ) ) 

, _alignment_amount ( _max( _clb_page_size_max, _os_page_size ) ) 
, _orclinal_alignment( _alignment_amount/_clb j3age_size_max ) 

{ 

CM = this; 

} 

Cachel nterf ace : :~Cachel nterface() 

^*******************************^ 

{ 
] 

PageQueue::PageQueue() 

: _queue( NULL ) 
, _size ( 0 ) 

, _threshold( 3 ) // PJB FIXME: should be based on number of threads 

, _head ( 0 ) 
, _tail (0 ) 

{ 
} 

void 

PageQueue::lnitialize( Pagelnfo **queue ) 

^***** ************** ******************** I 
{ 

_queue = queue; 

} 

void 

PageQueue::Resize( Caclie * cm, a_ptrint size ) 
I******************************************** I 

{ 

if( cm->recommit( _queue, _size, size, sizeof(Pagelnfo *) ) ) { 

_size = size; 

Pagelnfo * high = &cm->_info[cm->_config._current._n_infos]; 
for( a_ptrint i = 0; i < size; ++i ) { 

if( _queue[i] >= high ) { 
_queue[i] = NULL; 

} 

} 

} 

} 

void 

PageQueue::Enqueue( Pagelnfo * info ) 

I*********************************** I 

{ 

if( ((a_ptrint) (info->_queue_slot - _tail)) >= _size || 
_queue[info->_queue_slot%_size] != info ) { 
if( (_head - _tail) < (_size - _threshold) ) { 
_queue[(info->_queue_slot = _head++)%_size] = info; 

} 

} 



Pagelnfo * 

PageQueue::Dequeue() 

^****************** I 

{ 

return( Lhead -_tail) > _thresholcl? _queue[(_tail++)%_size] : NULL ); 

} 

static void 

Check_availablej)hysical_memory( uint64 cache_size, uint64 phys_avail ) 
{ 

#if !defined( WINNT ) && !defined( UNIX ) 

_unused( cache_size ); 

_unused( phys_avail ); 
#else 

#if defined( WINNT ) 
if( lsWindows95() ) return; 

#endif 

#if defined( UNIX) 

if( OS_TotalPhysicalMemory() == 0 ) return; 
#endif 

if( cache_size > phys_avail ) { 
startup_insg( IDS_ENG_CACHE_EXCEEDS_PHYS_MEM, 
(uint32)(cache_size/_u64_const(1024)), 
(uint32)(phys_avail/_u64_const(1 024)) ); 

} 

#endif 
} 

Cache: :Cache( p_enginej3arms ep, AWEInterface * awe ) 

***************************** ***************** I 

: Cachelnterface( ep ) 
#if defined( AWE_CACHE ) 

, _awe_cache( this, awe ) 
#endif 

, _images( _dbj3age_bits_max ) 
, _now( 0 ) 
, _rover( 0 ) 

{ 

uint64 phys_avail; 
#if !defined( AWE_CACHE ) 

_unused( awe ); 
#endif 

_pinned_images = 0; 

// Save the amount of physical memory available at this point in time. On platforms 
// where we cannot reserve/commit memory separately, we will want to compare the cache 
// size against this value later. 
phys_avail = OS_AvailablePhysicalMemory(); 
// Determine possible range of cache sizes. 
_config.init( ep, awe_enabled() ); 
if( !awe_enabled() ) { 
if( !_allocator.init( maximum_cache_size(), _alignment_amount ) ) { 



return; 

} 

// Cache size may have changed. 
if( !_config.fixup( _allocator.size() ) ) { 
return; 

} 

} 

#if defined( AWE_CACHE ) 
else { 

if( !_allocatorjnit(_config._maximum.cache_size_without_images(), _alignment_amount ) ) { 
return; 

} 

} 

#endif 

_config._initial = _config._current; // save for future reference 
if( !awe_enabled() ) { 
Check_availablej3hysical_memory( _config._initial.cache_size(), phys_avail ); 
} 

#if defined( DYNAMIC_CACHE_SIZE ) 
_auto_resize = ep->auto_resize? new CacheAutoResizeTimer( this ) : NULL; 
#endif 

recompute_headroom(); 
#if defined( DYNAMIC_CACHE_SIZE ) 
#define _pick_alignment(static_cache,dynamic_cache) (dynamic_cache) 

#else 

#def ine _pick_alignment(static_cache,dynamic_cache) (static_cache) 
#endif 

a_ptrint to_commit = _config._current._n_committed_images; 
_config._current._n_infos = 0; 
void * alloc = 

_allocator.alloc( 0, _config._maximum._n_infos, sizeof(Pagelnfo), 
_pick_alignment( sizeof(uint64), _os_page_size ) ); 
if( alloc == NULL ) return; 
Jnfo = (Pagelnfo *) alloc; 
alloc = 

_allocator.alloc( 0, _config._maximum._n_reusable, sizeof(Pagelnfo*), 
j)ick_alignment( sizeof(uint64), _os_page_size ) ); 
if( alloc == NULL ) return; 
_reusable.lnitialize( (Pagelnfo **) alloc ); 
_reusable.Resize( this, _config._current._n_reusable ); 

// FIXME: _hash_max does not currently change when the cache changes size. 
_hash_max = _config._current._n_hash_chains; 
J3age_hash = (CacheChain *) 
_allocator.alloc( _hash_max, 

_co nf ig ._m ax i m u m ._n_h as h_c h ai ns , 

sizeof(CacheChain), 

j3ick_alignment( sizeof(uint64), _os_page_size ) ); 
if( _page_hash == NULL ) return; 
for( unsigned i = 0; i < _hash_max; ++i ) { 
new ( & j3age_hash[i] ) CacheChain; 



} 

if( !awe_enabled() ) { 
_assertD( to_commit == _config._current._n_committed_images ); 
_config._current._n_committecl_images = 0; 
unsigned numj3ieces; 
const an_aligned_allocation_piece *p = 

_allocator.alloc_piecewise( 0, _config._maximum._n_committed_images, 

_db_page_size_max, 

_pick_alignment( _db_page_size_max, 
_alignment_amount ), 

MAX_IMAGE_ADDRESS_SPACE_RANGES, 

&num_pieces ); 
if( p == NULL ) return; 
for( unsigned i = num_pieces; i-- > 0; ) { 

_images.set_range( i, p[i].mem(), p[i].size() ); 

} 

// PJB FIXME: Too drastic? 
if( !Growlnfos( to_commit ) ) return; 
if( Commitlmages( 0, to_commit ) != 0 ) return; 
} 

#if defined( AWE_GACHE ) 
else { 

if( !_awe_cache.allocate_physical_memory( ep, _config._current.size_of_images() ) ) { 
return; 

} 

_frame_owner = (Pagelnfo **) malloc(_awe_cache._addr_space*sizeof(Pagelnfo*)); 
if( _frame_owner == NULL ) { 
return; 

} 

memset( _frame_owner, 0, _awe_cache._addr_space*sizeof(Pagelnfo*)); 
_frame_rover = 0; 

if( _awe_cache._n_dbpage_frames < to_commit ) { 

startup_msg( IDS_ENG_AWE_DID_NOT_ALLOCATE_EXPECTED_PHYSMEM, 
(uint32)(((uint64)to_commit*(uint64)_db_page_size_max) / _u64_const(1 024)), 

(uint32)(((uint64)_awe_cache._n_dbpage_frames*(uint64)_db_page_size_max) / _u64_const(1024)) ); 
to_commit = _awe_cache._n_dbpage_frames; 

_config._current._n_committed_images = _awe_cache._n_dbpage_frames; 

} 

if( !_awe_cache.allocate_address_space() ) { 
return; 

} 

if( !Growlnfos( to_commit ) ) return; 

// Images will gain addressability on demand. 

for( unsigned 1 = 0; 1 < _config._current._n_infos; ++i ) { 

Pagelnfo * info = &_info[i]; 

info->_image = NULL; 

info->Committed(); 

} 

} 

#endif 



Set PageSco ri ng Parameters () ; 

XM = this; 

_engine_statistic_set( CACHE_PINNED, _pinnecljmages ); 
_engine_statistic_set( MAI N_HEAP_P AGES, 0 ); 
Cachelnfo * info; 

void *image = Alloclmage( &info ); 
DV_lnitMainHeap( image, info, _clb_page_size_max ); 

_engine_statistic_set( CURRENT_CACHE_SIZE, current_cache_size()/1024 ); 

_engine_statistic_set( PEAK_CACHE_SIZE, current_cache_size()/1 024 ); 

_engine_statistic_set( MIN_CACHE_SIZE, minimum_cache_size()/1 024 ); 

_engine_statistic_set( MAX_CACHE_SIZE, maximum_cache_size()/1024 ); 

#if defined( LINUX) 
_touch_page_before_use = FALSE; 
int major, minor, patch; 

if( OS_Version( &major, &minor, &patch ) > 0 ) { 

if ( major == 2 && minor == 2 && patch < 1 7 ) { 
_touch j3age_before_use = TRUE; 

} 

} 

#endif 

} 

a_ptrint 

Cache::Commitlmages( a_ptrint lo, a_ptrint to_commit ) 

***************************** ****************** I 

{ 

a_ptrint hi = _config._current._n_infos; 
for( ; lo < hi && to_commit > 0; ++lo ) { 
a_ptrint tagged = 0; 

for(; tagged < to_commit && lo + tagged < hi && _info[lo+tagged].CanCommit(); ++tagged ); 
if( tagged > 0 ) { 

aj)trint alignedjo = round_up_ordinal( lo ); 

aj3trint aligned_hi = round_down_ordinal( lo + tagged ); 

if( alignedjo < aligned_hi ) { 
a_ptrint count = _images.commit( alignedjo, aligned_hi - alignedjo ); 
for( a_ptrint i = 0; i < count; ++i ) { 

_i nf o[al ig ned Jo + i] . Co m m itted () ; 

} 

_config._current._n_committedJmages += count; 
reco m pu te_head roo m () ; 
to_commit -= count; 
} 

lo += tagged; 

} 

} 

return( to_commit ); 

} 

a_bool 

Cache::Growlnfos( a_ptrint to_commit ) 

I********** ******ie******* ************ I 



a_ptrint original = _config._current._n_infos; 
a_ptrint requested = original + to_commit; 
if( recommit( Jnfo, original, requested, sizeof(Pagelnfo) ) ) { 
for( a_ptrint ordinal = original; ordinal < requested; ++ordinal ) { 
new (&_info[ordinal]) Pagelnfo( ordinal_toJmage( ordinal ) ); 

} 

_config._current._n_infos = requested; 
return( TRUE ); 
} 

return( FALSE ); 

} 

a_bool 

Cache::recommit( void *p, a_ptrint old_count, a_ptrint new_count, a_ptrint item_size ) 
********************************************************** ************* I 

{ 

#if defined( DYNAMIC_CACHE_SIZE ) 

_assertD( (((a_ptrint)p)&(_os_page_size-1)) == 0 ); 
_assertD( item_size <= _os_page_size ); 

a_ptrint old_size = (a_ptrint) _round_up_pow2( old_count * item_size, _os_page_size ); 

a_ptrint new_size = (a_ptrint) _round_up_pow2( new_count * item_size, _osj3age_size ); 

if( new_size > old_size ) { 
return( Vmem_commit( ((char *)p)+old_size, new_size-old_size ) ); 

} else if( new_size < old_size ) { 
return( Vmem_decommit( ((char *)p)+new_size, old_size-new_size ) ); 

} 

#else 

_unused( p ); 

_unused( old_count ); 

_unused( new_count ); 

_unused( item_size ); 
#endif 

return( TRUE ); 

} 

// PJB FIXME: Next two routines not quite right. 

a_bool 

Pagelnfo::CanCommit() 
^******************* I 

{ 

return( IsMissinglmageQ ); 

} 

void 

Pagel nf o : :Committed() 

^******************* I 

{ 

MarklmageAsAvailableO; 

} 

#if defined( DYNAMIC_CACHE_SIZE ) 
void 

Cache: :after_cache_size_change() 

^***** ************** ***********^ 



{ 

SetPageScoringParametersO; 
a_ptrint size_in_k = current_cache_size()/1024; 
_engine_statistic_set( CURRENT_CACHE_SIZE, size_in_k ); 
if( size_in_k > *_engine_counter( PEAK_CACHE_SIZE ) ) { 
_engine_statistic_set( PEAK_CACHE_SIZE, size_in_k); 
} 

DB_Message( IDS_ENG_CACHE_SIZE_CHANGED, size_in_k); 
#if IPRODUCTION 
LSBuf msg; 
#if defined( ALLOW_CACHE_TO_SHRINK ) 

a_ptrint minjnfos = DynamicCacheConfig::minimum_nJnfos(_config._current._n_committe^^^ ); 
if(_config._current._n_infos > minjnfos ) { 
sprintf( msg, "Cache config: %\6 images, %lcl[%ld ideal] infos", 
_config._current._n_committed_images, _config._current._n_infos, minjnfos ); 
DB_Message( msg ); 
return; 
} else 
#endif 

{ 

sprintf( msg, "Cache config: %ld images, %ld infos", 
_config._current._n_committedJmages, _config._current._nJnfos ); 
DB_Message( msg ); 
} 

#endif 

} 

#if defined( ALLOW_CACHE_TO_SHRINK ) 
a_bool 

Pagel nfo : : lsShhnkable() 

***************** ^ 

{ 

return( jaending == NULL && IJs.dirty && !lsLatched() ); 

} 

a_bool 

Cache: :lsShhnkable( Pagelnfo * info ) 

^***** ************** ***************** ^ 

{ 

if( !info->lsShrinkable() ) { 
return( FALSE ); 

} 

if( info->lslnHash() ) { 
a_cache_name name = info->name(); 
CacheChain * chain = ChainFor( name ); 

for( CacheRef * ref = chain->_refs; ref != NULL; ref = ref->_next ) { 

if( ref->_name.as_uint == name.as_uint ) { 
return( FALSE ); 
} 

} 

} 

return( TRUE ); 



} 

#if IPRODUCTION 
unsigned fake_out_opt; 
void 

Cache: :debug_images() 

^******************* I 

{ 

for( a _ptrint i = 0; i < avail_infos(); ++i ) { 
if( !_info[i].lsMissinglmage() ) { 
fake_out_opt += * (unsigned *) Unfo[i].Jmage); 

} 

} 

} 

#endif 
void 

Pagelnfo::Slirinl<( Cache * cm ) 

I**************************** I 
{ 

LatchO; 

if( IslnHashO ) { 
cm->RemoveFromHash( this ); 

} 

M arki m age As iVI iss i ng 0 ; 
_name.as_uint = BOGUS_NAME; 
UnlatchO; 

} 

a_ptrint 

Cache: :Decommit( a_ptrint lo, a_ptrint hi, aj3trint max ) 

******************************************* ******* I 

{ 

a_ptrint alignedjo = round_up_ordinal( lo ); 

a_ptrint aligned_hi = round_down_ordinal( hi ); 

if( aligned_hi < aligned_lo ) aligned_hi = alignedjo; 

a_ptrint count = aligned_hi - alignedjo; 

if( count > max ) count = max; 

if( count > 0 ) { 
debug JmagesO; 
alignedjo = aligned_hi - count; 
Jmages.decommit( alignedjo, count ); 
_config._current._n_committedJmages -= count; 
recompute_headroom(); 
for( a_ptrint i = 0; i < count; ++i ) { 

Jnfo[alignedJo + i].Shrink( this ); 

} 

if( aligned_hi == _config._current._nJnfos ) { 

_config._current._nJnfos = alignedjo; 

for( a_ptrint i = 0; i < count; ++i ) { 
Jnfo[alignedJo + i].~Pagelnfo(); 

} 

recommit( Jnfo, aligned_hi, alignedjo, sizeof(Pagelnfo) ); 



} 

debugJmagesO; 
} 

return( count ); 

} 

a_ptrint 

Cache::FindRange( a_ptrint hi, a_bool is_shrinkable ) 

***************************** ***************** I 

{ 

while( hi-- > 0 ) { 
if( lsShrinkable( &_info[hi] ) != is_shrinkable ) break; 
} 

return( hi + 1 ); 

} 

void 

Cache: :shrink_images( ajDtrint to_decommit ) 

^***** ***************************** ******** I 

{ 

_assertD( !awe_enabled() ); 

to_decommit = round_down_ordinal( to_decommit ); 

a_ptrint lo = _config._current._n_infos; 

while( to_decommit > 0 && lo > 0 ) { 
a_ptrint hi = FindRange( lo, FALSE ); 
lo = FindRange( hi, TRUE ); 
to_decommit -= Decommit( lo, hi, to_decommit ); 

} 

} 

a_bool 

Cache: :shrink_cache( DynamicCacheConfig &new_config ) 

^***** ***************************** ***************** I 

{ 

_assertD( !awe_enabled() ); 

a_ptrint committed = _config._current._n_committed_images; 

if( new_config._n_committed_images > committed ) { 
// Even though the cache size has decreased, it may cause the number of 
// images to increase due to other structures decreasing in size and 
// due to the way in which we compute the size of the various cache 
// components. All non-image components must shrink or remain the same 
// size. 

return( FALSE ); 
} 

// It is safe to wait for all lOs to complete while in SuperForbid state 

// because no worker can be doing synchronous lO if we are SuperForbidding 

// and the current worker can handle the completion of all async lOs 

DIO_Wait_all(); 

shrink_images( committed - new_config._n_committed_images ); 
_reusable.Resize( this, new_config._n_reusable ); 
_config._current._n_reusable = new_config._n_reusable; 
//PJBTODO: fix check. 
#if IPRODUCTION && 0 



CacheChain *chain; 
for( i=0; i<_hash_max; i++ ) { 
chain = &_page_hash[i]; 

for( info=chain->_heacl; info; info=info->_next ) { 
_assertD( info < maxjnfo ); 

} 

} 

#enclif 

// update the queues with meaningful info 

after_cache_size_change(); 

return( TRUE ); 

} 

#enclif // ALLOW_CACHE_TO_SHRINK 
a_ptrint 

Cache::Growlmages( a_ptrint to_commit ) 

^************************************* I 

{ 

a_ptrint orig = _config._current._n_infos; 
if( Growlnfos( to_commit ) ) { 
to_commit = Commitlmages( orig, to_commit ); 
} 

return( to_commit ); 

} 

a_bool 

Cache: :grow( a_ptrint to_commit ) 
{ 

a_ptrint requested = to_commit; 
to_commit = Commitlmages( 0, to_commit ); 
if( to_commit > 0 ) { 
to_commit = Growlmages( to_commit ); 
} 

return( to_commit != requested ); 

} 

a_bool 

Cache: :grow_cache( DynamicCacheConfig &new_config ) 

II Must be holding _cache_growth_mutex 
{ 

DynamicCacheConfig old_config; 
old_config = _config._current; 

if( new_config._n_committed_images < old_config._n_committed_images ) { 
// Even though the cache size has increased, it may cause the number of 
// images to decrease due to other structures increasing in size and 
// due to the way in which we compute the size of the various cache 
// components. All non-image components must grow or remain the same size. 
return( FALSE ); 

} 

_reusable.Resize( this, new_config._n_reusable ); 
_config._current._n_reusable = new_config._n_reusable; 



// If there are holes in the image array then _n_infos may need to 
// remain larger than number of images in the desired new configuration 
new_config._n_infos = _max( new_config._n_infos, old_config._n_infos ); 
if( !grow( new_config._n_committed_images - old_config._n_committed_images ) ) { 
return( FALSE ); 

} 

// update the queues with meaningful info 

after_cache_size_change(); 

return( TRUE ); 

} 

a_bool 

Cache: :grow_cache_by_images( a_ptrint images_to_add ) 

^*************************************************** I 

II Must already hold the _cache_growth_mutex 
{ 

// If we try to grow the cache by too small a value, the rounding 
// of the sizes of the various cache data structures may not 
// result in an increase in the number of images available 
if( awe_enabled() ) { 
return( FALSE ); 
} 

#define MIN_IMAGES_TO_ADD 64 

images_to_add = _max( images_to_add, MIN_IMAGES_TO_ADD ); 
images_to_add = round_up_ordinal( images_to_add ); 
DynamicCacheConfig config = _config._current; 
config._n_committed_images += images_to_add; 
if( config._n_committed_images > config._n_infos ) { 
config._n_infos = config._n_committed_images; 
} 

config._n_reusable = config._nJnfos; 
if( config.cache_size() > maximum_cache_size() ) { 
return( FALSE ); 
} 

return( grow_cache( config ) ); 

} 

a_bool 

Cache: :resize_cache( uint64 newsize ) 

******************* *********** I 

II Do the best we can to make the cache size approximately "newsize". 

// Returns true if cache size changed 

{ 

a_bool changed; 
DynamicCacheConfig config; 
if( awe_enabled() ) { 
return( FALSE ); 

} 

newsize = _max( newsize, minimum_cache_size() ); 
newsize = _min( newsize, maximum_cache_size() ); 
config. recompute( newsize ); 
if( config.cache_size() > maximum_cache_size() || 



config.cache_size() < minimum_cache_size() ) { 
return( FALSE ); 
} 

_cache_growth_mutex.get(); 

if( config.cache_size() > current_cache_size() ) { 

// We cannot SuperForbidO when growing the cache because 

// we may be trying to grow the cache in a panic in which case 

// we may have pages locked that other tasks are waiting for 

changed = grow_cache( config ); 

_cache_growth_mutex.give(); 
} else if( config.cache_size() < current_cache_size() ) { 

_cache_growth_mutex.give(); 

#ifdef ALLOW_CACHE_TO_SHRINK 

// Note: _config._current can change here but we cannot hold the 
// _cache_growth mutex when we call SuperForbid because one of the 
// workers may be trying to grow the cache (possibly in a panic) 
SuperForbidO; 

// Note that nobody can be holding the _cache_growth_mutex at this point 
if( config.cache_size() < current_cache_size() ) { 
changed = shrink_cache( config ); 
} 

SuperPermitO; 
#else 

changed = FALSE; 
#endif 

} else { 

_cache_growth_mutex.give(); 
changed = FALSE; 
} 

return( changed ); 

} 

#else 
a_bool 

Cache: :resize_cache( uint64 newsize ) 

^*********************************** ^ 

{ 

_unused( newsize ); 
return( FALSE ); 

} 

#endif 
a_ptrint 

Cache: :cache_available_images() 
{ 

a_ptrint total = avail_infos(); 
a_ptrint pinned =_pinned_images; 
return( total > pinned? total - pinned : 0 ); 

} 

a_ptrint 

Cache: :cache_available_addr() 



^*************************** I 

{ 

#if clefinecl( AWE_CACHE ) 

if( awe_enabled() ) { 
return( j3innedjmages < _awe_cache._adclr_space 
? (_awe_cache._addr_space - _pinned_images)*_db_page_size_max 
:0); 
} 

#endif 

return( cache_available_images() ); 

} 

a_bool 

Cache: :enough_pages_available( uint32 num_pages, a_bool grow_cache_if_necessary ) 
********************************************************** I 

II Assumes that the caller is looking to grow a large, locked heap so we care 

// that enough *address* space is available for the number of pages 

{ 

#if defined( DYNAMIC_CACHE_SIZE ) 

if( cache_available_addr() >= num_pages ) { 
return( TRUE ); 
} 

if( !grow_cacheJf_necessary || awe_enabled() ) { 
return( FALSE ); 
} 

_cache_growth_mutex.get(); 

a_ptrint avail = cache_available_addr(); 

if( avail >= num_pages ) { 
_cache_growth_mutex.give(); 
return( TRUE ); 

} 

grow_cache_by_images( numjaages - avail ); 
a_bool enough = ( cache_available_addr() >= num_pages ); 
_cache_growth_mutex.give() ; 
return( enough ); 
#else 

_unused( grow_cache_if_necessary ); 

return( cache_available_addr() >= num_pages ); 
#endif 
} 

#if IPRODUCTION 

// Use this routine like BMem in dballoc.c. 
typedef struct mp_alloc { 

struct mp_alloc *next; 

void *contents; 

a_debug_count count; 
} mp_alloc; 

mp_alloc *MultiPageAllocs = NULL; 
atomic32 MultiPageCount = 0; 
a_debug_count WMPmem = 0; 
static void BMPmem( a_debug_count watch ) 



r*************************************** 



II Set WMPmem to the count you want, then set a breakpoint at BMPmem 
{ 

WMPmem = watch; // prevent optimizer from merging functions 

} 

static void CheckMultiPageAllocs() 

II Verify that all multi-page allocations have been freed. 
{ 

_assertD( MultiPageAllocs == NULL ); 

} 

#endif 

Cache: :~Cache() 
{ 

unsigned i; 

_db_declare_yield( DBFINIHASH1, 30 ); 
#if defined( DYNAMIC_CACHE_SIZE ) 

if( _auto_resize != NULL ) { 
delete _auto_resize; 

} 

#endif 

DV_Fini(); 

#if IPRODUCTION 
CheckMu Iti PageAllocs() ; 

#endif 

for( i=0; i < _hash_max; ++i ) { 
/* Must call destructor to destroy Mutex - in Netware, open semaphores 

are not closed by the OS, and if we don't do it, the OS crashes. 7 
_page_hash[i].~CacheChain(); 
_db_yield( DBFINIHASH1 ); 

} 

#if defined( AWE_CACHE ) 

free( _frame_owner ); 
#endif 
} 

a_bool 

CM_lnit( p_engine_parms ep ) 

{ 

if( ep->page_bits < MIN_CACHE_PAGE_BITS ) { 
ep->page_bits = MIN_CACHE_PAGE_BITS; 
} 

return( (new Cache( ep, AWECache::Alloclnterface( ep ) ))->lsUpAndRunning() ); 

} 

void 

CM_Fini() 
{ 

delete CM; 



} 

#if defined(DYNAMIC_CACHE_SIZE) 
a_bool 

Cache: :suspend_resizing() 
****************** I 

{ 

if( _auto_resize != NULL ) { 

_auto_resize->suspend(); 

return TRUE; 
} else { 

return FALSE; 

} 

} 

a_bool 

Cache::resume_resizing() 

I********************** I 

{ 

if( _auto_resize != NULL ) { 

_auto_resize->resume(); 

return TRUE; 
} else { 

return FALSE; 

} 

} 

a_bool 

Cache: :resizing_suspended() const 

I******************************* I 

{ 

if( _auto_resize != NULL ) { 

return _auto_resize->suspended(); 

} else { 

return FALSE; 

} 

} 

#endif 

a_bool CM_ResizeCache( uint64 newsize ) 
I************************************* I 

{ 

a_bool ret = XM->resize_cache( newsize ); 
#if defined(DYNAMIC_CACHE_SIZE) 

XM->suspend_resizing(); 
#endif 

return ret; 

} 

a_bool CM_ResumeResizing() 

I************************ I 

{ 

#if defined(DYNAMIC_CACHE_SIZE) 

return( XM->resume_resizing() ); 
#else 



return TRUE; 
#enclif 
} 

uint64 CM_CurrentCacheSize() 
************** ******* I 

{ 

return( XM->current_cache_size() ); 

} 

uint64 CM_MinimumCacheSize() 

I************************** I 

{ 

return( XM->minimum_cache_size() ); 

} 

uint64 CM_MaximumCacheSize() 

I************************** I 
{ 

return( XM->maximum_cache_size() ); 

} 

a_bool 

CM_EnoughPagesAvailable( uint32 num_pages, a_bool grow_cache_if_necessary ) 

I************************************************************************* I 

{ 

return( XM->enough_pages_available( num_pages, grow_cache_if_necessary ) ); 

} 

a_ptrint 

Cache: :likely_available() 

I*********************** I 

II Assumes that the caller is looking to grow a large, locked heap so we care 

// that enough *adclress* space is available for the number of pages 

{ 

#if defined(DYNAMIC_CACHE_SIZE) 
if( resizing_suspended() ) { 

return( cache_available_addr() ); 
} else { 

return( cache_available_addr() +_headroom ); 

} 

#else 

return( cache_available_addr() + _headroom ); 
#endif 
} 

a_ptrint 

CM_LikelyAvailable() 

I****************** I 

{ 

return( XM->likely_available() ); 

} 

#if IPRODUCTION 

static void sem_clump( void ) 

// Dump latches to a file, hit the debugger. 



{ 

KSem_clump(); 
_assertD( FALSE ); 

} 

#if 0 // unused 

static void DbgPageLock( void ) 

^***************************** I 

{ 

#if 0 

// Keep track of number of page locks owned by current task. 

++_taskData( pagejocks ); 
#endif 
} 

static void DbgPageUnlock( Pagelnfo *info ) 

***************************** ******** I 

{ 

#if 0 

// Keep track of number of page locks owned by current task. 
// _assertD( _taskData( pagejocks ) != 0 ); 
if( _taskData( pagejocks ) == 0 ) { 
sem_dump(); 

} 

JaskData( pagejocks )--; 

// Do some page consistency checks on table pages if they have been 

// modified. 

info->Jile->consistency_check( frame->Jmage, info->_owner != NULL ); 
#eise 

_unused( info ); 
#endif 
} 

#endif // unused 
void 

CM_AssertNoPageLocks( void ) 

^***** ************** ******* I 

{ 

if( JaskData( pagejocks ) != 0 ) { 
sem_dump(); 
} 

} 

#endif 

#if IPRODUCTION 
void 

Cache: :CacheError( Pagelnfo *info, a_cache_error error ) 

^***** ******************************************* ******y 

{ 

char *msg; 
switch( error ) { 

case CACHE_ERR_WRITE_LOCK: 
msg = "modified without write lock"; 
break; 



case CACHE_ERR_UNLOCK: 
msg = "cannot be unlocked"; 

break; 

case CACHE_ERR_STILL_LOCKED: 
msg = "left locked"; 
break; 

default: 
msg = "Unknown error"; 

} 

#if !defined( UNDER_CE ) 

// Cache page num is wrong for SEGMENTED_CACHE, but don't worry about it 
// PJB FIXME: Add locking info back to msg 
char buf[256]; 

sprintf( buf, "cache page %d (page %ld) %s\n", 
ordinal( info ), 

info->_file->getj3age_no( info->Jmage ), 
msg ); 

DB_Message( buf ); 
#else 

_unused( info ); 

OutputDebugString( msg ); 
#endif 

_assertP( 101402, FALSE, 
"Cache error" ); 

} 

void 

Cache: :CheckForLockedPages( int db_no ) 

^***** ************** ****************** I 

{ 

#if 1 

//PJB FIXME: Implement. Note that pages can be locked by other 
// threads attempting to claim page. 
_unused( db_no ); 

#else 

for( a_ptrint i = 0; i < avail_infos(); i++ ) { 
Pagelnfo * info = &_info[i]; 
if( Lis_temporary( info->page_no() ) 

&& info->db_no() == db_no && info->lsLocked() ) { 

CacheError( info, CACHE_ERR_STILL_LOCKED ); 

} 

} 

#endif 
} 

void 

Cache::ChecklfStillUsedAtFileDrop( a_database_number db_no, unsigned file_no ) 

I**************************************************************************** I 

{ 

// Check to see if any pages are still in use. 
for( a_ptrint i = 0; i < availJnfosO; i++ ) { 
Pagelnfo * info = &_info[i]; 



if( info->db_no() == clb_no 

&& _file_num( info->page_no() ) == file_no ) { 

// PJB FIXME: Wrong error constant. 

CacheError( info, CACHE_ERR_STILL_LOCKED ); 

} 

} 

} 

#enclif 

llllllllllllllllllllllllllllllllllllllllllllllllllllllllllllllllllll^ 
void 

CacheRef : :Remove() 

^****************^ 

{ 

CacheChain * chain; 

while( (chain = _chain) != NULL && !chain->Remove( this ) ); 

} 

void 

CacheRef:: Latch ( a_bool shared ) 
******************* ****** I 

{ 

Page Info * info; 

for( ;; ) { 
a_cache_name name = _name; 
// PJB FIXME: abstract 
if( _chain == NULL ) return; 
info = Jnfo; 

if( info == NULL || !info->Latch( XM, name, shared ) ) { 
if( _chain == NULL ) return; 
if( _name.as_uint 1= name.as_uint ) continue; 
info = XM->lnstall( name, shared ); 

} 

info->FinishLock( shared ); 
if( _name.as_uint == info->name().as_uint ) break; 
info->Unlock(); 
Jnfo = NULL; 
} 

Jnfo = info; 
_assertD( IJs. locked ); 
Js. locked = TRUE; 

} 

CacheChain * 

CacheRef: :LatchChain() const 

^***** ************** *^ 

{ 

CacheChain * chain; 

while( (chain = _chain) 1= NULL ) { 
chain->Latch(); 
if( _chain == chain ) break; 
chain->Unlatch(); 

} 



return( chain ); 

} 

void 

CacheRef::Unlock() 
^**************** I 

{ 

if( Js. locked ) { 
Js. locked = FALSE; 
_info->Unlock(); 

} 

} 

void 

CacheRef::releaseRefs() 
I********************* I 

{ 

if(_chain != NULL ) { 
if( Js. locked ) { 

_chain->Remove( this ); 

UnlockO; 
} else { 

RemoveO; 

} 

} 

_assertD( Ms. locked ); 
Jnfo = NULL; 

_name.as_member.page_no = NULL_PAGE; 

} 

void 

CacheRef::clone( CacheRef const & ref ) 

************** ****************** I 

{ 

CacheChain * chain = ref.LatchChain(); 

if( chain != NULL ) { 
_chain = chain; 
Jnfo = ref .Jnfo; 
Jndex = ref.Jndex; 
JIags = ref.Jlags; 
Js.locked = FALSE; 
_name = ref._name; 
_next = chain->_refs; 
chain->_refs = this; 
chain->Unlatch(); 

} else { 
_chain = NULL; 
Jnfo = NULL; 

_name.as_member.page_no = NULL_PAGE; 
Jndex = ref.Jndex; 
JIags = ref.Jlags; 
Js.locked = FALSE; 
} 



} 

CacheRef::CacheRef( CacheRef const & ref ) 

^**************************************** I 
{ 

clone( ref ); 

} 

CacheRef& 

CacheRef: :operator=(CacheRef const & ref ) 
***************************** ****** I 

{ 

if( this != &ref ) { 
releaseRefsO; 
clone( ref ); 

} 

return *this; 

} 

void 

Cache: :Acld( CacheRef * ref ) 
^************************** I 

{ 

CacheChain * chain = ChainFor( ref->_name ); 

ref->_chain = chain; 

chain->Latch(); 

ref->_next = chain->_refs; 

chain->_refs = ref; 

chain->Unlatch(); 

_assertD( ref->_next != ref ); 

} 

void 

CacheRef: :force( Pagelnfo *info ) 

^***** ************** ************* I 

{ 

Jnfo = info; 
_name = info->name(); 
Jndex = 0; 
JIags = 0; 

_is.pinned_to_page = TRUE; 
Js. locked = TRUE; 
XM->Add( this ); 

} 

void 

CacheRef: :force( Pagelnfo *info, a_page_count index ) 
^***** ***************************** ****************** I 

{ 

Jnfo = info; 

_name = info->name(); 

Jndex = index; 

JIags = 0; 

Js. locked = TRUE; 

XM->Add( this ); 



} 

void 

CacheRef::Aclcl( a_cache_name name, a _page_count index ) 
***************************** ****************** I 

{ 

_name = name; 
Jndex = index; 
XM->Add( this ); 

} 

CacheRef::CacheRef( a_database_number db_no, a_page_id page_no ) 

^***** ******************************************* ************** I 

{ 

Jnfo = NULL; 
_flags = 0; 

_name = NameFor( db_no, page_no ); 

if( page_no == NULL_PAGE ) { 
_chain = NULL; 

} else { 
Jndex = 0; 

_is.pinned_to_page = TRUE; 
Add( _name ); 
} 

} 

CacheRef::CacheRef( a_database_number db_no, a_record_id const & id ) 

^***** ************************************************ ************** I 

{ 

Jnfo = NULL; 
Set( db_no, id ); 

} 

void 

CacheRef::Set( a_database_number db_no, a_recordJd const & id ) 
^***** ************************************************ ********* I 

{ 

JIags = 0; 

_name = NameFor( db_no, id.page_no() ); 

if( _name.as_member.page_no == NULL_PAGE ) { 
_chain = NULL; 

} else { 
Add(_name, id.index() ); 

} 

} 

void 

CacheRef::Latch( a_cache_name name, a_bool shared ) 

^***** ******************************************* *^ 

{ 

_assertD( _chain == NULL ); 

if( name.as_member.page_no == NULL_PAGE ) { 

releaseRefsO; 

} else { 
JIags = 0; 



Aclcl( name, 0 ); 
Latch( shared ); 
} 

} 

a_bool 

CacheRef::move_to( a_pagejcl page_no, a_page_count index ) 

// Move a reference to (page_no, index). The reference must currently 

// lock a page that contains a pointer to the new page. 

{ 

if( page_no == NULL_PAGE ) { 
releaseRefsO; 
Jndex = index; 
return FALSE; 

} else { 
Page Info *jnfo = Jnfo; 
_chain->Remove( this ); 

Add( NameFor( info->db_no(), page_no ), index ); 
Js.locked = FALSE; 
info->Unlock(); 
return TRUE; 
} 

} 

void 

CacheRef::lock_couple( a_pagejd page_no, a_bool shared ) 

^*******************************************************^ 

// Set reference to (and get a read lock on) new_page_no while holding 

// onto lock on existing page. 

{ 

Pagelnfo *info = Jnfo; 
_chain->Remove( this ); 

Latch( NameFor( info->db_no(), page_no ), shared ); 

info->Unlock(); 

mark_dirty( shared ); 

} 

// Stubs, 
void 

DIO_Async_init() 

^**************^ 

{ 
} 

void 

DIO_Async_fini() 

{ 
] 

void 

DIO_Wait_all() 

{ 



// PJB FIXME: see if we can eliminate. 
XM->WaitAII( NO_DB_ID ); 

} 

// PJB TODO: Eliminate these routines, 
void 

Cachelnfo::mark_clirty() 
{ 

((Pagelnfo *) this)->mark_dirty(); 

} 

void 

Cachelnfo::unlock() 
{ 

((Pagelnfo *) this)->unlock(); 

} 

void 

Cachel nf o : :write_to_read_lock() 
{ 

((Pagelnfo *) this)->ExclusiveToShared(); 

} 

a_bool 

Cachel nf o : : read_to_write_lock() 
{ 

a_bool success = ((Pagelnfo *) this)->TrySharedToExclusive(); 
if( success ) { 
mark_dirty(); 
} 

return ( success ); 

} 

void 

CacheRef : :u nlock_page() 

^********************* I 

{ 

UnlockO; 

} 

iiiiiiiiiiiiiiiiiiiiiiiiiiiiiiifiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiiniiiiiiim 

II Maintain an array of lOCBs. Scan to find free element, if we have 
//a ticket. Claim element with atomic operation. If we need to wait 
// for an lOCB, we pick a victim and wait? Should we keep track of 
// the number of outstanding lOs? 
#define IDLE_IO_DELAY 30 
void 

Cache::PrelO() 
{ 

_io.idle_timer.arm( -1 ); 

} 

void 

Cache::PostlO() 

{ 



// don't need to slow this down in low power mode 
_io.idle_timer.arm( IDLE_IO_DELAY ); 

} 

Cache::IOGIobals::IOGIobals() 
************** ******** I 

{ 

_engine_statistic_set( AVAILJO, MAXJOCB ); 

} 

a_bool 

Cache:: Wait Any 0 

I************** I 

{ 

for( unsigned i = 0; i < MAXJOCB; ++i ) { 
lOCB * iocb = &_io.iocb[i]; 
Pagelnfo * info; 

if( (info = iocb->_info) != NULL && info->TryLatch() ) { 
if( info->_pending == iocb && iocb->TryLatch() ) { 

iocb->DoFinish( info, TRUE, TRUE ); 

iocb->Unlatch(); 

info->Unlatch(); 

return( TRUE ); 
} 

info->Unlatch(); 

} 

} 

return( FALSE ); 

} 

void 

Cache: :WaitAII( a_database_number db_no ) 

I*************************************** I 

{ 

for( unsigned i = 0; i < MAXJOCB; ++i ) { 
IOCB * iocb = &Jo.iocb[i]; 
Pagelnfo * info; 

while( (info = iocb->Jnfo) != NULL ) { 

if( db_no == NO_DB_ID || info->db_no() == db_no ) { 
info->Latch(); 

if( db_no == NO_DBJD || info->db_no() == db_no ) { 

if( info->_pending == iocb ) { 
iocb->Latch(); 

iocb->DoFinish( info, TRUE, TRUE ); 
iocb->Un latch (); 
} 

} 

info->Unlatch(); 

} else { 
break; 

} 

} 

} 



void 

Cache: :WaitForExtencl( Pagelnfo * extend ) 
************** ******************** I 

II This will need to be modified if we add support for gather writes. 
{ 

a_database_number db_no = extend->_file->db->id(); 

a_page_id page_no = extend->page_no(); 

for( unsigned i = 0; i < MAXJOCB; ++i ) { 
lOCB * iocb = &_io.iocb[i]; 
Pagelnfo * info; 

if( (info = iocb->Jnfo) != NULL ) { 

a_cache_name name = info->name(); 

if( name.as_member.db_no == db_no && name.as_member.page_no >= page_no ) { 
if( info->Latch( this, name ) ) { 
if( info->_pending == iocb ) { 
iocb->Latch(); 

iocb->DoFinish( info, TRUE, TRUE ); 
iocb->Un latch (); 
} 

info->Unlatch(); 

} 

} 

} 

} 

} 

void 

Cache: :WaitUntilClean( IDatabaseFile * file ) 

^***** ***************************** ********* I 

II This will need to be modified if we add support for gather writes. 
{ 

for( unsigned i = 0; file->dirty_pages != 0 && i < MAXJOCB; ++i ) { 
IOCB * iocb = &_io.iocb[i]; 
Pagelnfo * info; 

if( (info = iocb->Jnfo) != NULL ) { 

a_cache_name name = info->name(); 
if( info->file() == file ) { 
if( info->Latch( this, name ) ) { 
if( info->_pending == iocb ) { 
iocb->Latch(); 

iocb->DoFinish( info, TRUE, TRUE ); 
iocb->Un latch (); 
} 

info->Unlatch(); 

} 

} 

} 

} 

_assertP( 101415, file->dirty_pages == 0, "File still dirty" ); 

} 



lOCB* 

Cache::GetlOCB( Pagelnfo * info ) 

^*******************************^ 
{ 

lOCB * iocb; 

for( ;; ) { 

iocb = &Jo.iocbUo.rover++%MAX_IOCB]; 
Pagelnfo * donor; 

if( (donor = iocb->_info) == NULL ) { 

if( iocb->TryLatch() ) { 
if( iocb->_info == NULL ) break; 
iocb->Unlatch(); 

} 

} else if( donor->TryLatch() ) { 

// NB: iocb could be held while building a scatter read. 

if( donor- >_pending == iocb && iocb->TryLatch() ) { 
iocb->DoFinish( donor, TRUE, TRUE ); 
if( iocb->_info == NULL ) { 

donor->Unlatch(); 

break; 

} 

iocb->Unlatch(); 
} 

donor->Unlatch(); 

} 

} 

iocb->_io_type = _taskData( io_req_type ); 
iocb->_info = info; 
iocb->_mask = 1 ; 

_engine_statistic_add( AVAILJO, -1 ); 
// PJB TODO: 
return( iocb ); 

} 

a_bool 

IOCB::Finish( Pagelnfo * info, a_bool wait, a_bool respect_evict ) 

^****************************************************************^ 

{ 

a_bool success = DoFinish( info, wait, respect_evict ); 
U n latch 0; 
return( success ); 

} 

a_bool 

IOCB::Finish( a_bool wait, a_bool respect_evict ) 

^*********************************************** I 

{ 

II PJB FIXME: what about latching Jnfo? 
return( Finish(_info, wait, respect_evict ) ); 

} 

a_bool 

IOCB::DoFinish( Pagelnfo * info, a_bool wait, a_bool respect_evict ) 



r***** ******************************************* ****************** 



// Might have "shared" access to page if waiting for shared access to 

// page being written. 

{ 

_assertD( info->_pending == this ); 

if( !wait_for_io( Task::me(), wait ) ) { 
_assertD( !wait ); 
return( FALSE ); 

} 

if( IsWriteO ) { 

_assertD( info == Jnfo ); 
if( WaitedO ) { 

_db_statistic_incr( db, NULL, DISK_WAITWRITE ); 

} 

info->w_complete(); 

if( _is.to_be_evicted && respect_evict ) { 
// must have exclusive access if we are to evict 
_assertD( info->HaveExclusively() ); 
XM->RemoveFromHash( info ); 
_is.to_be_evicted = FALSE; 

} 

Jnfo = NULL; // Gather writes not supported. 

} else { 
if( WaitedO ) { 

_db_statisticjncr( db, NULL, DISK_WAITREAD ); 

switch ( _io_type ) { 

case IOREQ_OPTIM : 
_db_statistic_incr( db,NULL,WAITREAD_OPTIM ); break; 

case IOREQ_TEMPTAB : 
_db_statistic_incr( db,NULL,WAITREAD_TEMPTAB ); break; 

case IOREQ_FULLCOMP : 
_db_statistic_incr( db,NULL,WAITREAD_FULLCOMP ); break; 

default : 

_db_statistic_incr( db,NULL,WAITREAD_UNKNOWN ); 
} 

} 

info->r_complete(); 
if( _mask == 1 ) { 

Jnfo = NULL; 
} else if( info == _info ) { 

a_cache_name name = info->name(); 

do{ 

name.as_member.page_no++; 

_mask »= 1 ; 
} while( (_mask&1) == 0 ); 

Jnfo = XM->ChainFor( name )->AssuredFind( name ); 
} else { 

_mask&= -(1 « (info->page_no() - Jnfo->page_no())); 

} 

} 



if( info == NULL ) { 
_engine_statistic( AVAIL_IO ); 
} 

// A failed lO may have completed on another thread 
Su icideOn Fatal Error() ; 

// PJB FIXME: should we pass pointer to wait 

// counter? Guaranteed that only one waiter from 

// upper levels (owner of lOCB). Should do wait_for_io( me ). 

return( TRUE ); 

} 

a_bool 

IOCB::lsActuallyPending( void ) 

^***************************** I 

{ 

#if defined( UNDER_CE ) 

return FALSE; 
#elif defined( WINNT) 

return _state.pending_io; 
#else 

return _state.as_member.pendingJo; 
#endif 
} 

void 

Cache: :AddToReusable( Pagelnfo * info ) 

******************* ************* I 

{ 

if( !info->lsMissinglmage() ) { 
_assertD( info->HaveExclusively() && !info->lslnHash() ); 
info->_name.as_uint = BOGUS_NAME; 
if( info->_pending != (lOGB *) Pagelnfo "REUSABLE ) { 

_assertD( info->_pending == NULL ); 

info->_pending = (lOCB *) Pagelnfo::REUSABLE; 

} 

#if SUPPORT_CACHE_COLDSTART 
info->SetColdstartRecorded( FALSE ); 
#endif 

_reusable.Enqueue( info ); 
} 

} 

Pagelnfo * 

Cache: :AllocReusable() 
^******************** I 

{ 

Pagelnfo * info = _reusable.Dequeue(); 
if( info && info->TryLatch() ) { 
if( info->lsReusable() ) { 

info->j)ending = NULL; 

return info; 

} 

info->Unlatch(); 



} 

return( NULL ); 

} 

// Page Info methods. 
Pagelnfo::~Pagelnfo() 

^********************* I 

{ 
} 

Pagelnfo::Pagelnfo( void * image ) 

: _next( NULL ) 

, _flags( 0 ) 
#if IPRODUCTION 

, first_lock( 0 ) 

, first_write( 0 ) 
#endif 

, _reaLpage_no( 0 ) 
#if clefined( CHECKSUM ) 

, checksum ( 0 ) 
#enclif 

, _pending( (lOCB *) IMAGE_MISSING ) 

{ 

_name.as_uint = BOGUS_NAME; 
Jmage = image; 

_is.preimage_may_not_be_committed = FALSE; 
#ifdef SUPPORT_CACHE_COLDSTART 

_is.coldstart_recorded = FALSE; 
#endif 
} 

a_bool 

Pagelnfo::CanPreventReuse() 

{ 

a_name_reuse_state state = _state; 

a_name_reuse_state new_state; 

while( state. bits. is_in_hash ) { 
new_state = state; 
new_state. bits . ref_cou nt++ ; 

if( CSwap( &_state.as_cell, &state.as_cell, new_state.as_cell ) ) return TRUE; 
} 

return FALSE; 

} 

a_bool 

Pagel nf o : : AllowReuse() 
{ 

a_name_reuse_state state = _state; 
a_name_reuse_state new_state; 
do{ 

new_state = state; 



new_state. bits . ref_cou nt-- ; 
} while( !CSwap( &_state.as_cell, &state.as_cell, new_state.as_cell ) ); 
return !state.bits.is_in_hash; 

} 

a_bool 

Pagelnfo::SetlnHash( a_bool in_hash ) 
^***********************************^ 

{ 

a_name_reuse_state state = _state; 
a_name_reuse_state new_state; 
do{ 

new_state = state; 

new_state.bits.is_in_hash = in_hash; 
} while( !CSwap( &_state.as_cell, &state.as_cell, new_state.as_cell ) ); 
return new_state.bits.ref_count == 0; 

} 

void 

Pagelnfo::RecordHit( Cache * cm ) 
^***** ************** ************ I 

{ 

unsigned now = cm->_now; 

if( (int) (now -_visited_at) > cm->_delta ) { 
_visited_at = now; 
a_prs_slot score = _score; 

_score = score >= MAX_SCORE? MAX_SCORE : score + 1 ; 
} 

} 

a_bool 

Pagelnfo::Latch( Cache * cm, a_cache_name name, a_bool shared ) 

^***** ************************************************ ******** I 

II Block only for pages named name. Returns TRUE if latch has been 
// obtained (FALSE => the name of the info might have changed). 
{ 

if( TryLatch( shared ) ) { 
if( HasName( name ) ) { 
RecordHit( cm ); 
return( TRUE ); 

} 

UnlatchO; 

} else if( HasName( name ) ) { 
if( Can Prevent ReuseO ) { 

a_bool recycle; 

if( HasName( name ) ) { 
Latch( shared ); 
recycle = AllowReuse(); 
if( HasName( name ) ) { 

_assertD( Irecycle ); 

RecordHit( cm ); 

return( TRUE ); 

} 



if( recycle && !lsPinnecl() ) { 

if( Ishared || TrySharedToExclusiveO ) { 
cm->AclclToReusable( this ); 

} 

} 

UnlatchO; 
} else { 

// We just lost a race trying to latch page 
// so let the cleaner pick up the page. 
AllowReuseO; 
} 

} 

} 

return( FALSE ); 

} 

a_bool 

Pagelnfo::Scrub() 

^*************** I 

{ 

#if IPRODUCTION 

class lOCB * pending = _pending; 

_assertD( pending == NULL && HaveExclusively() ); 
#endif 

if( _is.tracked_tablej)age ) { 
_file->db->_pagectr->RemoveCachedPage( _tid, page_no(), !_is.blob_page ); 
_is.tracked_table_page = FALSE; 

} 

if( Js. dirty ) { 
Js.dirty = FALSE; 

_is.preimage_may_not_be_committed = FALSE; 
if( Us_temporary( _file->origin ) ) { 
_file->dec_dirty_pages(); 

} 

return( TRUE ); 
} 

return( FALSE ); 

} 

a_bool 

Cache: :RemoveFromHash( Pagelnfo * info ) 

^********** ************** ************** I 

{ 

CacheChain * chain = ChainFor( info->name() ); 
a_bool was_dirty = info->Scrub(); 
chain->Remove( info ); 
info->_name.as_uint = BOGUS_NAME; 
a_bool reusable = info->SetlnHash( FALSE ); 
if( reusable ) { 
AddToReusable( info ); 
} 

return( was_dirty ); 



} 

void 

Pagelnfo::PrepareForAdcl( a_cache_name name, unsigned now ) 

******************************************* ******** I 

II Prepare page for (possibly) going into cache. 
{ 

_visited_at = now; 
_score = 0; 
_name = name; 
_file = NULL; 

_assertD( !_is.tracked_table_page ); 
_real_page_no = name.as_member.page_no; 

} 

Pagelnfo * 

Cache: :AddToHash( CacheChain * chain, a_cache_name name, Pagelnfo * alloc ) 

^***** ********************************************************** **********^ 

{ 

alloc->PrepareForAdd( name, _now ); 
Pagelnfo * info = chain->FindOrlnsert( name, alloc ); 
if( info == alloc ) { 
info->SetlnHash( TRUE ); 

info->_pending = (lOCB *) Pagelnfo ::JUST_INSTALLED; 
++_now; 
} 

return( info ); 

} 

inline a_bool 

Pagelnfo ::lsReapable() const 

^***** ************** *^ 

{ 

return !j3ending; 

} 

void 

Pagel nfo : : Do Wait ForPending() 

^************************** I 

{ 

_assertD( !_is.preimage_may_not_be_committed ); 

TRACE( MultiSpindleWaitPending( 0 ) ); 

lOCB * iocb = _pending; 

if( iocb != NULL ) { 
iocb->Latch(); 
if( _pending == iocb ) { 

iocb->DoFinish( this, TRUE, FALSE ); 

} 

iocb->Unlatch(); 
} 

} 

void 

Pagel nfo ::PrepareForRead( IOCB * iocb ) 

^***** ************** ****************** I 



Database * db = _CurrentDB; 
// need to prepare for reading if shared 
_file = file_for_page( db, page_no() ); 
a_physical_page location = page_no() - _file->origin; 
if( location > db->DB_Max_physical_page_number ) { 
DB_Fatal( SQLSTATE_ACCESS_BEYOND_END_OF_MAX_DBSPACE, 
IDS_ENG_FMSG_ACCESS_BEYOND_END_OF_MAX_DBSPACE); 
} 

_reaLpage_no = page_no(); 

_assertD( !_is.preimage_may_not_be_committed ); 

_pending = iocb; 

_grant_image_access() ; 
#if IPRODUCTION 

if( !db->is_magic_db() ) { 
db->Store->ClearPageNo( Jmage ); 

} 

#endif 
} 

IOCB * 

Pagel nf o : :StartRead() 
{ 

PrepareForRead( XM->GetlOCB( this ) ); 

_file->start_read( this ); 
return( _pending ); 

} 

void 

Pagel nfo : : DoWaitForPreimage() 
{ 

Database * db = _file->db; 

if( db->has_separate_checkpoint_log() ) { 
// A preimage has been added to the (separate) checkpoint log 
// and may or may not have been committed yet. 
_assertD( _checkpointJog_pos != 0 ); 
if( _checkpoint_log_pos > 

_file->db->_checkpoint_log->last_committedj30S() ) { 

// Force the preimage to be committed 

_file->db->_checkpoint_log->flush( _checkpoint_log_pos ); 

} 

} else { 

// Preimage is in database file: if it hasn't been committed 
// it will be in cache. 

Pagelnfo * info = XM->lslnCache( NameFor( db_no(), _rollback_page_no ) ); 
if( info 1= NULL ) { 

info->WaitForPending(); 

info->Unlatch(); 

} 

// Ensure that the preimage has been committed by OS. 



_file->flush_fsys_cache(); 
} 

_is.preimage_may_not_be_committecl = FALSE; 

} 

lOCB* 

Pagelnfo::StartWrite( a_bool evict ) 

^***** **************** ************* I 

II Must have exclusive access going in. 
{ 

Su icideOn Fatal Error() ; 

_C u r re ntCo n nect io n-> Add I OCou nt () ; 

WaitForPreimageO; 

_pending = XM->GetlOCB( this ); 

_pending->_is.to_be_evicted = evict; 

_g rant_image_access() ; 

_file->start_write( this ); 

_assertD( !_is.preimage_may_not_be_committed ); 
return( jaending ); 

} 

void 

Pagelnfo::Write( a_bool wait ) 
{ 

StartWrite()->Finish( wait, FALSE ); 

} 

void 

Pagel nf o : : WriteAnd EvictQ 
********** ******** I 

{ 

StartWrite( TRUE )->Finish( FALSE, TRUE ); 
UnlatchO; 

} 

void 

Pagelnfo::Evict() 

^*************** I 
{ 

WaitForPendingO; 
WaitForPreimageO; 
XM->RemoveFromHash( this ); 
UnlatchO; 

} 

void 

Pagel nfo : :write_and_f lush() 

^***** ************** ******* I 

{ 

Write( TRUE ); 

_f ile->f lush_f sys_cache() ; 

} 

a_bool 

Pagelnfo::is_pencling() 



^********************^ 

{ 

if( .pending == (lOCB *) REUSABLE 
II .pending == (lOCB *) IMAGE_MISSING 
II J3ending == (lOCB *) PINNED ) { 
//this should never happen to pages we are interested in 
_assertD( FALSE ); 
return TRUE; 

} else { 

return j3ending != NULL && j3ending->lsActuallyPending(); 
} 

} 

void 

Pagelnfo::FinishLock( a_bool shared ) 

************** **************** I 

{ 

Worker * me = _CurrentWorker; 
Database *db = me->active_db(); 
Connection *c = me->active_con(); 
_db_statistic_incr( db, c, CACHE_READ ); 
Eng->cache_stats->_lookups++ ; 
_engine_statistic( CACHE_READ_ENG ); 
#ifdef SUPPORT_CACHE_COLDSTART 

if( llsColdstartRecordedO && (_real_page_no == page_no() ) ) { 
SetColdstartRecorded( TRUE ); 

db->_coldstart_manager.record_page( _real_page_no ); 

} 

#endif 

if( JustlnstalledO ) { 
_assertD( HaveExclusivelyO && IsAddressableQ ); 
StartRead()->Finish( TRUE, FALSE ); 
if( shared ) { 

ExclusiveToSharedO; 

} 

_assertD( _pending == NULL ); 

} else { 
WaitForPendingO; 

_db_statistic_incr( db, c, CACHE_HITS ); 
Eng->cache_stats->_cache_hits++; 
_engine_statistic( CACHE_HITS_ENG ); 
_assertD( _pending == NULL ); 
XM->MakeAddressable( this ); 
} 

#if IPRODUCTION 

if( IDisableAssertNotFree ) { 
AssertNotFree( db ); 

} 

#endif 

// Since async lOs can complete on another task, 
// a failed lO may have caused the assertion on that 



// other task. We cannot allow the caller to continue 

// because it may assume that all lOs have completed 

// successfully. 

SuicideOnFatalErrorO; 

_g rant_image_access() ; 

TRACE( CacheLock( _name.as_uint ) ); 

switch( _file->get_page_usage( Jmage ) ) { 

case TABLE_PAGE: 
_db_statistic_incr( db, c, CACHE_TABLE_READ ); 
break; 

case INDEX_PAGE: 
_db_statistic_incr( db, c, CACHE_INDEXLEAF_READ ); 
break; 

} 

} 

void 

Pagelnfo::unlock() 

^**************** I 

{ 

TRACE( CacheUnlock( _name.as_uint ) ); 
_revoke_image_access() ; 
U match 0; 

} 

void 

Pagelnfo::AssertNotFree( Database * db ) 
{ 

if( db->has_freej)age_bit_maps() ) { 
_assertD( _file->chkpt_free_map == NULL 
II !_file->chkpt_free_map->lsMember( page_no() ) ); 
_assertD( _file->current_free_map == NULL 
II !_file->current_free_map->lsMember( page_no() ) ); 
_assertD( _file->reusable_free_map == NULL 
II !_file->reusable_free_map->lsMember( page_no() ) ); 
} 

} 

void 

Pagel nfo : :r_complete() 

I******************** I 

{ 

_file->finish_read( this ); 

XM->assert_page_no( _file->db, page_no(), _image ); 
J3ending = NULL; 
_revoke_image_access() ; 

} 

void 

Pagel nfo : :w_complete() 

{ 

_assertD( !_is.preimage_may_not_be_committed ); 



_file->finish_write( this ); 

if( Js.dirty ) { 
// Might not be dirty during cache flushes, etc. 
Js.dirty = FALSE; 
if( Lis_temporary( _file->origin ) ) { 

_file->dec_dirty_pages(); 

_file->db->_auto_ckpt->inc_recovery_io(); 

} 

} 

J3ending = NULL; 
_revoke_image_access() ; 

} 

// PJB FIXME. 
void 

Cachelnfo::SetTablelnfo( a_table_id tid, a_bool is_blob_page ) 

^***********************************************************^ 

{ 

Pagelnfo * info = (Pagelnfo *) this; 
if( tid != NO_TABLE_ID ) { 
info->_tid = tid; 

info->_is.blob_page = is_blob_page; 
info->_is.tracked_table_page = TRUE; 
AddCachedPage( db(), tid, page_no(), !is_blob_page ); 
} 

} 

void 

Cachelnfo::Pin() 

^************** I 

{ 

((Pagelnfo *) this)->Pin(); 

} 

void 

Cachelnfo::Unpin() 

I**************** I 

{ 

((Pagelnfo *) this)->Unpin(); 

} 

void 

Pagelnfo::SetPrelmage( a_page_id page_no ) 
{ 

_is.preimage_may_not_be_committed = TRUE; 
_checkpoint_log_pos = page_no; 

} 

// CacheChain methods, 
void 

CacheChain ::Add( CacheRef * ref ) 

******************* ******* I 

{ 

LatchO; 



ref->_next = _refs; 
_refs = ref; 
ref->_chain = this; 
U n latch 0; 

} 

a_bool 

CacheChain::Remove( CacheRef * remove ) 

^************************************* I 

{ 

a_bool right_chain; 
LatchO; 

if( remove->_chain == this ) { 
CacheRef * ref; 
CacheRef ** pref; 

for( pref = &_refs; (ref = *pref) != NULL; pref = &ref->_next ) { 

jf( ref == remove ) { 
*pref = ref->_next; 
ref->_chain = NULL; 
UnlatchO; 
return TRUE; 

} 

} 

right_chain = TRUE; 

} else { 
right_chain = FALSE; 

} 

UnlatchO; 

return right_chain; 

} 

// Hash lookup table manipulation 
Pagelnfo * 

CacheChain::Fincl( a_cache_name name ) 
{ 

a_cache_name last; 
last.as_uint = 0; 

for( Pagelnfo * info = _heacl; info != NULL; info = info->_next ) { 
a_cache_name current_name = info->_name; 
if( current_name.as_uint == name.as_uint ) return( info ); 
if( current_name.as_uint > name.as_uint ) return( NULL ); 
if( current_name.as_uint < last.as_uint ) return( NULL ); 
//PJBFIXME: Is this safe? 
Iast.as_uint = current_name.as_uint + 1 ; 

} 

return( NULL ); 

} 

Pagelnfo * 

CacheChain::AssuredFind( a_cache_name name ) 

{ 



Pagelnfo * info = Fincl( name ); 

if( info == NULL ) { 
LatchlnfosO; 
info = Fincl( name ); 
UnlatchlnfosO; 

} 

return( info ); 

} 

Pagelnfo * 

CacheChain::FinclOrlnsert( a_cache_name name, Pagelnfo * insert ) 

******************************************* ************** I 

{ 

LatchlnfosO; 
Pagelnfo * info; 
Pagelnfo ** pinfo; 

for( pinfo = &_head; (info = *pinfo) != NULL; pinfo = &info->_next ) { 
if( info->_name.as_uint >= name.as_uint ) { 

if( info->_name.as_uint == name.as_uint ) goto done; 
break; 

} 

} 

insert- >_next = info; 
*pinfo = info = insert; 
done: 

UnlatchlnfosO; 
return info; 

} 

void 

CacheChain::Remove( Pagelnfo * remove ) 

^***** ************** ****************** I 

{ 

LatchlnfosO; 
Pagelnfo * info; 
Pagelnfo ** pinfo; 

for( pinfo = &_head; (info = *pinfo) 1= NULL; pinfo = &info->_next ) { 
if( info == remove ) { 
*pinfo = info->_next; 
break; 

} 

} 

UnlatchlnfosO; 

} 

// Basic cache operations. 
Pagelnfo * 

Cache::lnstall( a_cache_name name, a_bool shared ) 

^***** ***************************** ************** I 

{ 

CacheChain * chain = ChainFor( name ); 
Pagelnfo * info; 

for( info = chain->Find( name );; ) { 



if( info && info->Latch( this, name, shared ) ) break; 
Pagelnfo * alloc = Alloc(); 
info = AddToHash( chain, name, alloc ); 
if( info == alloc ) break; 
AddToReusable( alloc ); 
alloc->Unlatch(); 
} 

_assertD( chain->AssuredFind( name ) == info ); 
return info; 

} 

Cachelnfo * 

Cache: :lnstall( a_database_file * f, a_page_id page_no, a_page_id real_page_no ) 

^****************************************************************** 

{ 

a_cache_name name = NameFor( f->db->id(), page_no ); 
Pagelnfo * info = lnstall( name ); 
if( real_page_no != page_no ) { 
f = file_for_page( f->db, real_page_no ); 
} 

_assertD( info->_name.as_uint == name.as_uint ); 

if( info->Justlnstalled() ) { 
info->_pending = NULL; 
info->_file = f; 

info->_real_page_no = realj)age_no; 
} else { 

// PJB FIXME: should be assertPs 
_assertD( info->_file == f ); 
_assertD( info->_real_page_no == real_page_no ); 
// PJB FIXME: How can we get here? 
//_assertD( !info->is_dirty() ); 
info->WaitForPending(); 
a_bool was_dirty = info->Scrub(); 
_unused( was_dirty ); 
MakeAddressable( info ); 
} 

// PJB FIXME: cf force_hash 
_g rant_image_access() ; 
return( info ); 

} 

Pagelnfo * 

Cache: :lsNotlnCache( a_cache_name name ) 
^***** ************** ******************* I 

{ 

CacheChain * chain = ChainFor( name ); 

Pagelnfo * info = chain->Find( name ); 

if( info == NULL ) { 
Pagelnfo * alloc = Alloc(); 
info = AddToHash( chain, name, alloc ); 
jf( info == alloc ) return info; 
AddToReusable( alloc ); 



alloc->Unlatch(); 
} 

return NULL; 

} 

Pagelnfo * 

Cache::lslnCache( a_cache_name name ) 
^***********************************^ 

{ 

Pagelnfo * info = ChainFor( name )->AssuredFincl( name ); 

if( info && info->TryLatch() ) { 
if( info->HasName( name ) ) return info; 
info->Unlatch(); 

} 

return NULL; 

} 

Pagelnfo * 

Cache: :LatchlflnCache( a_cache_name name ) 

^**************************************** I 

{ 

Pagelnfo * info = lslnCache( name ); 

if( info ) { 
info->WaitForPencling(); 
MakeAcldressable( info ); 

} 

return info; 

} 

a_bool 

Cache::lslmmediatelyLatchable( a_cache_name name ) 

***************************** ************** I 

{ 

Pagelnfo * info = ChainFor( name )->AssuredFind( name ); 
return info 1= NULL && !info->is_pending(); 

} 

a_bool 

Cache::lslOPending( a_cache_name name ) 

^***** ************** ****************** I 

{ 

Pagelnfo * info = ChainFor( name )->AssuredFind( name ); 
return info 1= NULL && info->isj3ending(); 

} 

// Page replacement routines. 
Pagelnfo * 

Cache: :Alloc() 

^************ I 

{ 

Pagelnfo * info; 

unsigned fence = _rover + avail_infos(); 
while( (info = AllocReusableQ) == NULL ) { 
if( (int) (fence - _rover) < 0 || (info = Scavenge()) == NULL ) { 
while( info == NULL ) { 



info = WaitAnyO? Scavenge() : Panic(); 
} 

fence = _rover + avail_infos(); 

} 

_assertD( info->HaveExclusively() ); 
if( info->lsDirty() ) { 

info->StartWrite( TRUE )->Finish( FALSE, TRUE ); 

// PJB TODO: Should we wait if too many pending lOs? 
} else { 

if( info->lslnHash() ) { 
Eng->cache_stats->_cache_replacements++; 
_engine_statistic( CACHE_REPLACEMENTS ); 
info->WaitForPending(); 
RemoveFromHash( info ); 

} else { 
AddToReusable( info ); 

} 

} 

info->Unlatch(); 
} 

MakeAddressable( info ); 
_assertD( !info->_is.dirty ); 
#if defined( LINUX) 

// Linux has VM manager bug in kernels before 2.2.17. 
// An attempt to write to an OS page that is not in memory 
// corrupts first 1 6 bytes of that page. Work around was to 
// touch first byte of the OS page so that it gets allocated into 
// the process memory map. 
if( _touch_page_before_use ) { 
_grant_image_access(); 

char *ptr = (char *) info->_image; 
char *end_of_page = ptr + _db_page_size_max; 
while( ptr < end_of_page ) { 
((int*)ptr)[0] = 0; 
ptr += _os_page_size; 

} 

_revoke_image_access() ; 
} 

#endif 

return( info ); 

} 

void 

Pagelnfo::Pin() 

^************* I 

{ 

_assertD( HaveExclusivelyO ); 
J3ending = (lOCB *) PINNED; 
++XM->_pinned_images; 

_engine_statistic_set( CACHE_PINNED, XM->j3inned_images ); 
TRACE( CachePin( _name.as_uint ) ); 



UnlatchQ; 

} 

void 

Pagelnfo::Unpin() 
^*************** I 

{ 

LatchO; 

_assertD(_pencling == (lOCB *) PINNED ); 
TRACE( CacheUnpin( _name.as_uint ) ); 
jDending = NULL; 
--XM->_pinned_images; 

_engine_statistic_set( CACHE_PINNED, XM->_pinned_images ); 

} 

void * 

Cache: :Alloclmage( Cachelnfo ** pinfo ) 

II Exclusive access, but might be freed by another task. 
{ 

Pagelnfo *info = Alloc(); 

*pinfo = info; 
info->Pin(); 

_grant_image_access(); 
return( info->Jmage ); 

} 

void 

Cache::Freelmage( Cachelnfo * cinfo ) 

***************************** *^ 

{ 

Pagelnfo * info = (Pagelnfo *) cinfo; 
_revoke_image_access() ; 
info->Unpin(); 
AddToReusable( info ); 
info->Unlatch(); 

} 

void * 

Cache: :multi_page_alloc( uint32 num_pages, 
uint32 page_size, 

MultiPageAlloc *handle ) 

^***********************************************^ 

// Alloc a group of contiguous pages, aligned on a page boundary 
// (or on a sector boundary on NT). 

{ 

// First try to allocate from the cache 

// if( successful ) { 

// handle->_aligned = (starting page); 
// handle->_malloced = FALSE; 
//}else{ 
#if defined( WINNT ) 

handle->_unaligned_mem = NULL; 

handle->_aligned_mem = VirtualAlloc( NULL, page_size * num_pages. 



MEM_COMMIT, PAG E_READ WRITE ); 
#else 

hanclle->_unaligned_mem = ut_alloc( (num_pages + 1) * page_size ); 
hanclle->_alignecl_mem = align( hanclle->_unalignecl_mem, page_size ); 
#enclif 

_assertP( 101413, handle->_alignecl_mem != NULL, 

"Unable to allocate a multi-page block of memory" ); 
handle->_mallocecl = TRUE; 
#if IPRODUCTION 

{ 

mp_alloc *mpalloc; 

mpalloc = (mp_alloc *)ut_alloc( sizeof( mp_alloc ) ); 
mpalloc->contents = handle->_aligned_mem; 
mpalloc->next = MultiPageAllocs; 
++ Mu Iti PageCou nt ; 
mpalloc->count = MultiPageCount; 
MultiPageAllocs = mpalloc; 
if( MultiPageCount == WMPmem ) { 
BMPmem( WMPmem ); 
} 

} 

#endif 

return( handle->_aligned_mem ); 
//} 

} 

void 

Cache::multi j)age_free( MultiPageAlloc *handle ) 

^***** ***************************** ************ I 

{ 

#if IPRODUCTION 

{ 

mp_alloc **head; 

mp_alloc *mpalloc; 

if( handle->_aligned_mem != NULL ) { 
for( head = (mp_alloc **)&MultiPageAllocs;; ) { 

mpalloc = *head; 

_assertD( mpalloc 1= NULL ); 

if( mpalloc->contents == handle->_aligned_mem ) { 
if( mpalloc->count == WMPmem ) { 
BMPmem( WMPmem ); 

} 

*head = mpalloc->next; 
ut_free( mpalloc ); 
break; 
} 

head = &mpalloc->next; 

} 

} 

} 

#endif 



if( handle->_mallocecl ) { 
#if definecl( WINNT ) 

VirtualFree( handle->_alignecl_mem, 0, MEM_RELEASE ); 
#else 

ut_free( handle->_unaligned_mem ); 
#endif 

handle->_malloced = FALSE; 
handle->_unaligned_mem = NULL; 
handle->_aligned_mem = NULL; 
} else { 

// Release pages allocated from the cache. 
} 

} 

class ScavengeState { 
public: 

ScavengeStateO 
: threshold( 0 ) 
, counter( 0 ) 

{ 

} 

public: 

unsigned threshold; 
unsigned counter; 

}; 

#if defined( AWE_CACHE ) 
void 

Cache::DoMakeAddressable( Pagelnfo * info ) 

^***** ***************************** ******* I 

II NOTE: We never steal the address space of a dirty page 

// so that don't need to go looking for address space at checkpoint 

//time 
{ 

Pagelnfo ** frame; 
Pagelnfo * owner; 

a_byte * image; 
ScavengeState state; 

for( a_ptrint fence = _frame_rover + _awe_cache._addr_space;; ) { 
if( info->_image 1= NULL ) { 
frame = NULL; 
break; 

} 

a_ptrint rover = _frame_rover++; 

frame = &_frame_owner[rover%_awe_cache._addr_space]; 

owner = *frame; 

if( owner == NULL ) { 

if( CSwapPtr( frame, &owner, info ) ) { 
image = ordinal_to_image( frame - _frame_owner ); 
break; 
} 

} else if( CanScavenge( owner, &state ) ) { 



if( owner->lsDirty() ) { 
owner->StartWrite( TRUE )->Finish( FALSE, TRUE ); 
// PJB TODO: Should we wait if too many pending lOs? 

} else if( owner- >_image != NULL ) { 
image = (a_byte *) owner->_image; 

frame = &_frame_ownerLimages.image_to_ordinal( image )]; 
break; 
} 

owner->Unlatch(); 

} 

if( (int) (fence - rover) < 0 ) { 
if( IWaitAnyO ) { 

DB_Fatal( SQLSTATE_DYNAMIC_MEMORY_EXHAUSTED, NULL ); 
} 

fence += _awe_cache._addr_space; 

} 

} 

void * old = info->_image; 
if( frame != NULL ) { 
for( ;; ) { 

if( old != NULL ) { 
if( owner != NULL ) { 
owner->Unlatch(); 
} else { 

*frame = NULL; 

} 

break; 
} 

if( CSwapPtr( &info->_image, &old, TAG_UNMAPPED( image ) ) ) { 
if( owner != NULL ) { 
*frame = info; 
owner->_image = NULL; 
owner->Unlatch(); 

} 

break; 
} 

} 

} 

image = STRIP_TAG( info->_image ); 
while( info->_image != image ) { 
if( _awe_cache.map_image( image, ordinal( info ) ) ) { 

while( !CSwapPtr( &info->_image, &old, image ) ); 

break; 

} 

} 

} 

#endif 

a_bool 

Cache: :CanScavenge( Pagelnfo * info, ScavengeState * state ) 

******************************************* ********** ^ 



{ 

if( info->lsReusable() && !info->lsLatched() ) { 
if( info->TryLatch() ) { 

if( info->lsReusable() ) { 
return TRUE; 

} 

info->Unlatch(); 

} 

} else if( info->lsReapable() && !info->lslnUse() ) { 
unsigned score = (1 4*info->_score)/1 6; 
if( score > state->threshold ) { 

info->_score = score; 

if( state->counter == 0 ) { 
if( state->threshold < MAX_THRESHOLD ) { 

++state->threshold; 

} 

state->counter = state->threshold*_incr; 

} else { 
--state->counter; 

} 

} else if( info->TryLatch() ) { 

if( info->lsReapable() && !info->lsPinned() ) { 
return TRUE; 

} 

info->Unlatch(); 

} 

} 

return FALSE; 

} 

Pagelnfo * 
Cache: :Scavenge() 

II Attempt to find a page (not necessarily with address space) suitable 

// for reuse. 

{ 

ScavengeState state; 
unsigned i = _rover; 
unsigned j; 

while( (unsigned) (j = _rover++ - i) < availJnfos() ) { 
// PJB FIXME: get rid of mod 
Pagelnfo * info = &_info[(i+j)%avail_infos()]; 
if( CanScavenge( info, &state ) ) { 

return info; 

} 

} 

return NULL; 

} 

Pagelnfo * 
Cache::Panic() 



{ 

#if defined( DYNAMIC_CACHE_SIZE ) 

// We must be absolutely certain that it is impossible to grow 
// the cache and that we didn't fail to scavenge something just 
// because someone else shrank the cache or grew it to its max 
// after we did our first scavenging. 
// 

// However, it is possible to enter the panic code while growing 
// the cache so avoid recursion if we are growing the cache. 
_cache_growth_mutex.get() ; 

#endif 

#if 0 

// DT_Find_memory is currently stubbed out. We can safely returned if 

// we have returned pages. Calling Scavenge will not tell us that. 

DT_Fi nd_memory 0 ; 

Page Info * info = Scavenge(); 
#endif 

Pagelnfo * info = NULL; 
#if defined( DYNAMIC_CACHE_SIZE ) 

#define PANIC_GROWTH_AMOUNT 64 

if( !info && grow_cache_by_images( PANIC_GROWTH_AMOUNT ) ) { 
info = ScavengeQ; 
} 

_cache_growth_mutex.give() ; 
#endif 
if( !info ) { 

DB_Fatal( SQLSTATE_DYNAMIC_MEMORY_EXHAUSTED, 
IDS_ENG_FMSG_DYNAMIC_MEMORY_EXHAUSTED ); 
} 

return( info ); 

} 

// User routines. 
Pagelnfo * 

Cache: :Lock( a_cache_name name, a_bool shared ) 

^********************************************* ^ 

{ 

Pagelnfo * info = LockRaw( name, shared ); 

assertj3age_no( info->_file->db, info->page_no(), info->_image ); 

// FIXME: JCS 

// info->_file->sanity_check( page_no, info->_image, TRUE ); 
return ( info ); 

} 

// PJB FIXME: other lock functions that should be implemented as wrappers that 
// call lock and markdirty as needed. 

// Note that we cannot convert read to write latch without the possibility 

//of giving up info. 

/* PJB FIXME: Implement 

void 

Pagelnfo::Unlock() 
{ 



// _debug( DbgPageUnlock( this ) ); 

U n latch 0; 

if( Hatched ) { 
_vm_protect( this ); 

} 

} 

7 

unsigned 

Cache: :Hint( a_cache_name name ) 

{ 

Pagelnfo * info = lsNotlnCache( name ); 
if( info == NULL ) { 
return( 0 ); 
} 

info->StartRead()->Finish( FALSE, FALSE ); 
info->Unlock(); 

_db_statistic_incr( DBFromlD( name.db_no ), NULL, READ_HINTS ); 
return( 1 ); 

} 

void 

Cache ::Evict( a_cache_name name ) 

^*******************************^ 

H For FreePageByld 
{ 

Pagelnfo * info = lslnCache( name ); 
if( info != NULL ) { 
info->Evict(); 
} 

} 

void 

Cache::Evict( a_database_number db_no, unsigned file_no, a_bool is_scrammed ) 

******************************************* 

// Checkpoint must be done beforehand. 
{ 

#if PRODUCTION 

_unused( is_scrammed ); 
#endif 

for( unsigned i = 0; i < avail_infos(); ++i ) { 
Pagelnfo * info = &_info[i]; 
a_cache_name name = info->name(); 
if( name.as_member.db_no == db_no && 
( file_no == ALL_FILES 

II file_no == _file_num( name.as_member.page_no ) 

II (file_no == MAPPED_PAGES 
&& info->page_no() != info->_real_page_no) ) ) { 

if( info->Latch( this, name ) ) { 
if( info->lsPinned() ) { 

// Heap was left locked: track it down. 

_assertPNR( 101416, FALSE, "Heap left locked at database close." ); 



info->_pending = NULL; 
} else { 

i nf o - > Wai t Fo r Pe nd i ng () ; 

} 

a_bool was_dirty = RemoveFromHash( info ); 
_unused( was_dirty ); //for PRODUCTION builds 

_assertD( !was_dirty || is_scrammed || _is_temporary( name.as_member.page_no ) ); 
info->Unlatch(); 
} 

} 

} 

} 

struct a_flushed { 
Pagelnfo * info; 
a_page_id page_no; 

}; 

static int 

compare_page_ids( const void *elem1 , const void *elem2 ) 
^***** ******************************************* ****** I 

{ 

// Cannot just return the difference between the two page numbers 
// because the page numbers are unsigned and can have the high bit 
// set if dbspace 8 or higher exists. That screws up the ordering 
// and the external checkpoint log relies on it. See flushj3ages. 

a_pagejd pg1 = ((a_flushed *)elem1)->page_no; 
a_page_id pg2 = ((a_flushed *)elem2)->page_no; 
return( (pg1 == pg2) ? 0 : ((pg1 < pg2) ? -1 : 1) ); 

} 

void 

Cache::FlushPages( Database *db, a_flushed *flushed, unsigned n ) 

I*************************************************************** I 

II Flush all marked pages for specified database. 
{ 

// NOTE: When using an external checkpoint log, there is an 
// implicit assumption that the following qsort() is done. If the 
// definition page for the main dbspace is an element of the 
// "infos" set, we must start a write on that definition page 
// before starting an lO on any other page in the set because 
// starting a write on any other page may cause the separate 
// checkpoint log code to attempt to write-lock the definition 
// page when flushing a preimage. Since the "writing" bit is 
// already turned by Cache: :f lush for all of the pages we are 
// about to write, whte-locking the definition page will cause 
// the write-lock by the separate checkpoint log code to hang 
// waiting for the write of the definition page to complete (an lO 
// which has not actually been issued yet). 
qsort( flushed, n, sizeof(flushed[0]), compare_page_ids ); 
_taskData( io_req_type ) = IOREQ_CHKPTWRT; 
for( unsigned i = 0; i < n; ++i ) { 
a_cache_name name = NameFor( db->id(), flushed[i].page_no ); 



Pagelnfo * info = flushecl[i].info; 

if( info->Latch( this, name ) ) { 

if( info->_is.dirty ) { 
info->WaitForPencling(); 
if( info->_is.dirty ) { 

_checksum( info->_image ); // blank padding 

info->StartWrite()->Finish( FALSE, TRUE ); 

} 

} 

info->Unlatch(); 

} 

} 

_taskData( io_req_type ) = IOREQ_UNKNOWN; 
_db_only_statistic_add( db, CHECKPOINT_FLUSH, n ); 

} 

#define FLUSH_MAX 256 

#if !defined(ON_BUILD_MACHINE) && defined( WINNT ) && !defined( UNDER_CE ) 

#define MEASURE_WRITE_TIMES 

#endif 

void 

Cache::DoFlush( p_database db, a_bool flush_temp ) 

^***** ***************************** ************** I 

{ 

ajlushed flushing[FLUSH_MAX]; 

unsigned flush_count = 0; 
#if defined(MEASURE_WRITE_TIMES) 

unsigned flush_total = 0; 

LARGEJNTEGER startjme; 

LARGEJNTEGER stop_time; 

LARGEJNTEGER frequency; 

QueryPerformanceCounter( &start_time ); 
#endif 

a_database_number db_no = db->id(); 

_assertP( 101403, _CurrentWorker->is_forbidding(), 

"FlushCache: worker is not forbidding" ); 
for( a_ptrint i = 0; i < avail_infos(); i++ ) { 
Pagelnfo * info = &_info[i]; 
a_cache_name name = info->name(); 
if( name.as_member.db_no == db_no && info->_is. dirty && 

(flush_temp || !_is_temporary( name.as_member.page_no )) && 
!info->lsPinned() ) { 
flushing[flush_count].info = info; 

flushing[flush_count].page_no = name.as_member.page_no; 
++flush_count; 

} 

if( flush_count == FLUSH_MAX ) { 

FlushPages( db, flushing, flush_count ); 
#if defined(MEASURE_WRITE_TIMES) 

flush_total += flush_count; 
#endif 



flush_count = 0; 

} 

} 

if( flush_count != 0 ) { 

FlushPages( db, flushing, flush_count ); 
#if clefinecl(MEASURE_WRITE_TIMES) 

flush_total += flush_count; 
#enclif 

flush_count = 0; 
} 

WaitAlK db_no); 
// Recompute_stats(); 
#if defined(MEASURE_WRITE_TIMES) 
QueryPerformanceCounter( &stop_time ); 
Query PerformanceFrequency( &frequency ); 
if( flush_total > 0 ) { 

double est = (stop_time.QuadPart - start_time.QuadPart)*1000.0/(frequency.QuadPart*flush_total); 
db->_auto_ckpt->set_write_time( est ); 
} 

#endif 

// PJB TODO: Figure out a better location for this. 
SetPageScoringParametersO; 

} 

void 

Cache::Flush( p_database db ) 

^***************************^ 

// Flush out dirty pages in preparation for a checkpoint. 
{ 

DoFlush( db, FALSE /* dont flush temp */ ); 

} 

void 

Caohe::sa_flush_cache( p_database db ) 

************** ***************** I 

II Implementation of sa_flush_cache internal stored procedure. 

// Write all dirty pages and evict from the cache as many pages as possible 

// that belong to the specified database 

{ 

ForbidO; 

DoFlush( db, TRUE /* flush temp 7 ); 

a_database_number db_no = db->id(); 

for( unsigned i = 0; i < avail_infos(); ++i ) { 
Pagelnfo * info = &_info[i]; 
a_cache_name name = info->name(); 
if( name.as_member.db_no == db_no && !info->lslnUse() ) { 

if( info->Latch( this, name ) ) { 
_assertD( llnfo->_pending && linfo->_is.dirty ); 
RemoveFromHash( info ); 
info->Unlatch(); 

} 

} 



} 

PermitO; 

} 

void 

Cache::FlushCacheForFileDrop( a_clatabase_number clb_no, unsigned file_no ) 

************************************************ ****************** I 

II A checkpoint must be done before this call. 
{ 

Evict( db_no, file_no, FALSE ); 
#if IPRODUCTION 

ChecklfStillUsedAtFileDrop( db_no, file_no ); 
#endif 
} 

#if IPRODUCTION 
void 

Cache::ChecklfStillUsedAtCommit( a_database_number db_no, Cachelnfo *defj3age ) 

^***************************************************************************** I 

{ 

// PJB FIXME: How to avoid spuhous errors? 
#if 1 

_unused( db_no ); 
_unused( def_page ); 
#else 

// Check to see if any pages are still in use. 
for( a_ptrint 1=0; i < availJnfos(); i++ ) { 
Page Info * info = &_info[i]; 
if( info->db_no() == db_no 

&& !Js_temporary( info->page_no() ) 

&& info->lsLocked() 

&& info != (Pagelnfo *) def_page 

&& info->_file->get_page_usage( info->_image ) 1= LOG_PAGE ) { 

cache_error( info, CACHE_ERR_STILL_LOCKED ); 

// We can still trip across this when returning blobs 

// via streams: we call CmdSeqPres::SendMultiPiece 

// with a pointer into a page. This is likely not to 

// cause any grief (other than a potentially unbounded 

// wait while holding a page locked.) PJB 9/14/00. 

// Another way to hit it is while adding a row to 

// a Java index; the deserialize code can call Yield(), 

// which context switches while we have locks. ITB 9 Dec 2002 

} 

} 

#endif 
} 

#endif 
aj)trint 

Cache::Clean( Database *db, unsigned rover, unsigned count ) 

I********************************************************** I 

II Issue an lO for "count" dirty pages in the cache if there are 

// any valid candidates. Called by idle lO and by auto checkpoint code. 



{ 

a_flushed flushing[FLUSH_MAX]; 
unsigned flush_count = 0; 

a_database_number db_no = db == NULL? NO_DB_ID : db->id(); 
if( count > FLUSH_MAX ) { 
count = FLUSH_MAX; 
} 

a_ptrint limit = cache_available_images(); 
if( limit > 500 * count ) { 
limit = 500 * count; 
} 

// Collect a set of candidates: 
unsigned i; 

for( i = rover; (unsigned) (rover - i) < limit; ++rover ) { 
// PJB FIXME: get rid of mod. 
Pagelnfo * info = &_info[(rover + i)%avail_infos()]; 
a_cache_name name = info->name(); 

if( (name.as_member.db_no == db_no || db_no == NO_DB_ID) && 

!_is_temporary( name.as_member.page_no ) && info->_is.dirty && linfo->_pending ) { 
flushing[flush_count].info = info; 

flushing[flush_count].page_no = name.as_member.page_no; 
++flush_count; 

if( flush_count >= count ) break; 

} 

} 

qsort( flushing, flush_count, sizeof(flushing[0]), compare_page_ids ); 

for( i = 0; i < flush_count; ++i ) { 
Pagelnfo * info = flushing[i].info; 
if( info->TryLatch() ) { 

a_cache_name name = info->name(); 

if( (name.as_member.db_no == db_no || db_no == NO_DB_ID) && 
!_is_temporary( name.as_member.page_no ) && info->_is.dirty && !info->_pending ) { 
// PJB FIXME: _vmj)rotect( info ); 
_checksum( info->_image ); // blank padding 
info->StartWrite()->Finish( FALSE, TRUE ); 
_db_only_statistic( info->_file->db, IDLE_WRITES ); 

} 

info->Unlatch(); 

} 

} 

return ( rover ); 

} 

unsigned 

CM_Clean( Database *db, unsigned rover, unsigned count ) 

^***** ******************************************* ****** I 

{ 

// PJB FIXME: get rid of cast. 

return( (unsigned) XI\/l->Clean( db, rover, count ) ); 

} 

// CacheRef operations 



struct AdjustList { 

AdjustListO 
: fixup( NULL ) 

{ 

} 

a_page_id page_no; 
CacheRef *fixup; 

ldlelOTimer::ldlelOTimer() 

: _rover( 0 ) 



void 

ldlelOTimer::dispatch() 

#if defined( DYNAMIC_CACHE_SIZE ) 

// Prevent the cache from shrinking 

PreventSuperForbidO; 
#endif 

_rover = CM_Clean( NULL, _rover, 1 ); 
#if defined( DYNAMIC_CACHE_SIZE ) 

AllowSuperForbidO; 
#endif 
} 

void 

Cache: :adjust( DoAdjust *cb, Database *db, 

aj3age_id pO, a_page_id p1 , a_page_id p2 ) 

{ 

Worker *me = _CurrentWorker; 
a_database_number db_no = db->id(); 
CacheChain *chain; 
CacheRef *ref; 
CacheRef *nref; 
CacheRef **next; 

CacheChain *bogus = me->_bogus_chain; 
AdjustList adjust[2]; 
AdjustList *a; 

a_cache_name name = NameFor( db_no, pO ); 

adjust[0].page_no = p1 ; 

adjust[1].page_no = p2; 

bogus->Latch(); 

chain = ChainFor( name ); 

chain->Latch(); 

for( next = &chain->_refs; (ref = *next) != NULL; ) { 
if( ref->_name.as_uint == name.as_uint ) { 
uint i = cb->do_adjust( ref ); 
if( i == 0 ) { 



next = &ref->_next; 

} else { 
*next = ref->_next; 
// PJB FIXME: does this work? 
if( ref->_is. locked ) { 

// Must be on same connection. 

ref->unlock(); 

} 

a = &adjust[i-1]; 
ref->Jnfo = NULL; 

ref->_name = NameFor( db_no, a->page_no ); 
if( a->page_no == NULL_PAGE ) { 

ref->_chain = NULL; 
} else { 

ref->_next = a->fixup; 

a->fixup = ref ; 

ref->_chain = bogus; 

} 

} 

} else { 

next = &ref->_next; 

} 

} 

chain->Unlatch(); 

for( a = &adjust[0]; a < &adjust[2]; ++a ) { 
if( a->fixup ) { 
chain = ChainFor( NameFor( db_no, a->page_no ) ); 
chain->Latch(); 

for( ref = a->fixup; ref 1= NULL; ref = nref ) { 
nref = ref->_next; 
ref->_chain = chain; 
ref->_next = chain->_refs; 
chain->_refs = ref; 

} 

chain->Unlatch(); 

} 

} 

bogus->Unlatch(); 

} 

void 

Cache: :kick_auto_resize() 
{ 

#if defined( DYNAMIC_CACHE_SIZE ) 

if( _auto_resize ) { 
_auto_resize->kick() ; 

} 

#endif 
} 

void 



Cache: :engine_startup_complete() 

^***** ************** *********** I 

{ 

#if defined( DYNAMIC_CACHE_SIZE ) 

if( _auto_resize ) { 
_auto_resize->enable() ; 

} 

#enclif 
} 

void 

Cache: :cache_message( void ) 
^************************** I 

{ 

uint64 current_size = current_cache_size(); 

startup_msg( IDS_ENG_CACHE_MEMORY_USAGE, (uint32)(current_size/_u64_const(1024)) ); 
#if defined(DYNAMIC_CACHE_SIZE) 

if( !awe_enabled() ) { 
uint64 min_size = minimum_cache_size(); 
uint64 max_size = maximum_cache_size(); 
startup_msg( IDS_ENG_CACHE_SIZE_RANGE, 
(uint32)(min_size/_u64_const(1024)), 
(uint32)(max_size/_u64_const(1 024)) ); 

} 

#endif 

#if defined( AWE_CACHE ) 

if( awe_enabled() ) { 
startup_msg( IDS_ENG_AWE_CACHE_SIZE, 

(uint32)(_awe_cache.phys_mem_size()/(uint64)(1024)), 

(uint32)(_images.total_size()/(uint64)(1 024)) ); 

} 

#endif 
} 

#if 0 

// #def ine VM_PROTECT 

typedef volatile a_ptrint a_pseudo_atomic; 

#if defined( VM_PROTECT ) 

#define _vm_protect( info ) XM->vm_protect( info ) 

#define _vm_protect_nfl^( image ) XM->vm_protect_nfl^( image ) 

#define _vm_protect_noaccess( image ) XM->vm_protect_noaccess( image ) 

#define_vm_temp_protect_rw( image ) DWORD old_access = XM->vm_protect_rw( image ) 

#define_vm_restore_protection( image ) if( ^old_access != PAGE_READWRITE ) XM->vm_do_protect( image, 

^old_access ) 

DWORD vm_do_protect( void *image, DWORD protect ) 

{ 

DWORD old_access; 

Virtual Protect( image, _db_page_size_max, protect, &old_access ); 
return( old_access ); 
} 

DWORD vm_protect_rw( void *image ) 
{ 



DWORD olcl_access; 

VirtualProtect( image, _clb_page_size_max, PAGE_READWRITE, &olcl_access ); 
return( olcl_access ); 
} 

DWORD vm_protect_noaccess( void *image ) 
{ 

DWORD old_access; 

Virtual Protect( image, _db j3age_size_max, PAGE_NOACCESS, &old_access ); 
return ( old_access ); 
} 

void vm_protect( Pagelnfo *info ) 
{ 

if( info->_count || info-> _pending ) { 

vm_protect_rw( info->_image ); 
} else { 

vm_protect_noaccess( info->_image ); 

} 

} 

#else 

#define_vm_protect( info ) 

#define _vm_protect_rw( image ) 

#define _vm_protect_noaccess( image ) 

#define _vm_tempj3rotect_rw( image ) 

#define _vm_restore_protection( image ) 
#endif 
#endif 
void 

Cache: :hint_page_group( PageGroup *scatter, aj3age_id start, uint32 to_hint ) 

{ 

IDatabaseFile * file = scatter->_file; 
_assertD( scatter->_ref_count == 1 ); 

// "start" should be on a reasonable boundary, e.g. a multiple of num_pages. 

_assertD( (_physical_page(start) % scatter->NumBufferPages()) == 0 ); 

if( _physicaLpage( start ) + scatter->NumBufferPages() >= file->_current_dbspace_size ) { 
// Less than a full block until end-of-file. 
return; 

} 

a_database_number db_no = file->db->id(); 
lOCB * iocb = NULL; 
unsigned offset; 
unsigned length; 

for( ; to_hint != 0; to_hint »= 1 , ++start ) { 
if( (to_hint&1) ) { 

Pagelnfo * info = lsNotlnCache( NameFor( db_no, start ) ); 

if( info 1= NULL ) { 
if( iocb == NULL ) { 

iocb = GetlOCB( info ); 

offset = 0; 

} 



iocb->_mask |= 1 « offset; 
info->PrepareForReacl( iocb ); 
scatter->Map( offset, info->_image ); 
info->Unlock(); 
length = ++offset; 
continue; 
} 

} 

if( iocb != NULL ) { 

scatter->Map( offset, NULL ); 
++offset; 

} 

} 

if( iocb != NULL ) { 
if( iocb->_mask == 1 ) { 

file->start_read( iocb->_info ); 
} else { 

file->start_read( iocb->_info, scatter, length ); 

} 

iocb->Unlatch(); 

_clb_statistic_incr( file->clb, NULL, READ_HINTS ); 
} 

} 

#if 0 

#if IPRODUCTION 

void Cache: :_dump_cache_info( void ) 
************** *************** I 

{ 

FILE *out; 
a_cache_index i; 
Page Info *info; 

out = fopen( "c:\\cache.out", "wb" ); 
if( out == NULL){ 
return; 
} 

fprintf( out, " %-8s %-5s %-5s\n", "image", "info", "usage" ); 
for( i=0; i<_config._current._n_infos; i++ ) { 
#if defined(DYNAMIC_CACHE_SIZE) 
if( !awe_enabled() && !_allocation_map.test( i ) ) { 
// page is not committed 
continue; 

} 

#endif 

void *image; 

#if defined( AWE_CACHE ) 
if( awe_enabled() ) { 

image = ordinal_to_image( i ); 

if( image == NULL ) { 
break; 

} 



} else { 

image = orclinal_to_image( i ); 

} 

#else 

image = orclinal_to_image( i ); 
#enclif 

info = _image_toJnfo( image ); 
_vm_temp_protect_rw( image ); 
a_byte usage = (((a_byte *)image)[4] & 0x7); 
_vm_restore_protection( image ); 

fprintf( out, "IMG %08p %08p %cl\n", image, info, usage ); 
} 

fprintf( out, " %-8s %-8s %-8s %5s %s\n", "info", "image", "physmem", "locks", "evicted/trashed" ); 
for( i=0; i<_config._current._n_infos; i++ ) { 
info = _info.get( i ); 

fprintf( out, "INF %08p %08p %08x %5d %s%s\n", 
info, info->_image, info->get_physmem_id( this ), info->_count, 
info->_is.evicted?"e":"", 
info->_is.trashed?T:"" ); 
} 

fprintf( out, "Avail QueueVn" ); 

fprintf( out, "%-8s %-8s\n", "info", "image" ); 

a_pseudo_atomic tail = 0; 

while( _avail.do_dequeue( tail ) 1= NOT_QUEUED ) { 
info = _avail.get( tail ); 

fprintf( out, "%08p %08p\n", info, info->_image ); 
} 

fclose( out ); 

} 

extern "C" void Dump_cache_info( void ); 
void Dump_cache_info( void ) 

{ 

XM->_dump_cache_info(); 

} 

#endif 
#endif 

//dbpcache.h 

// Copyright (c) 2004. Sybase, Inc. All Rights Reserved. 

II ******************************************************************* 

II Copyright 1991-2003 iAnywhere Solutions, Inc. All rights reserved. 
II **************************************************************** 

#ifndef ll_DBPCACHE 
#define ll_DBPCACHE 
// #include "utqueue.h" 
//#include "atomic, h" 
//#include "dbsrvapi.h" 
#include "dbfile.h" 
#include "dbstat.h" 
class DBPage; 



class IDatabasefile; 

class Pagelnfo; 

class PageGroup; 

class MultiPageAlloc; 

class DynamicCacheConfig; 

class an_image_set; 

class Cache; 

class CacheRef; 

class lOCB; 

class CacheChain; 

#define BOGUS_NAME (uint64 (-0)) 

union a_cache_name { 

uint64 as_uint; 

struct { 
uint32 page_no; 
uint32 db_no; 

} as_member; 

}; 

inline a_cache_name NameFor( a_database_number dbjd, a_page_id pagejd ) { 
a_cache_name name; 
name.as_member.page_no = pagejd; 
name.as_member.db_no = dbJd; 
return( name ); 

} 

class DBSRVAPI Cachelnfo { 

public: 

union a_disk_page *disk_page() { 
return( (union a_diskj3age *)_image ); 
} 

DBPage *db_page() { 
return( (DBPage *)_image ); 
} 

IDatabaseFile *file() { 
return(_file ); 
} 

Database *db() { 
return(_file->db); 
} 

void write_and_unlock( Cachelnfo *delay ); 

void write_and_flush(); 

a_bool read_to_write_lock(); 

void write_to_read_lock(); 

void mark_dirty(); 

void unlockO; 

void Pin(); 

void Unpin(); 

void SetTablelnfo( a_table_id tid, a_bool is_blob_page ); 
protected: 

fhend class Cache; 
friend class CacheRef; 



friend class lOCB; 
friend class CacheChain; 
void *_image; 
a_cache_name _name; 
IDatabaseFile *_file; 
public: //PJBTODO: make these protected 
a_page_id page_no() const 
{ 

return _name.as_member.page_no; 
} 

a_database_number db_no() const 
{ 

return (a_database_number)_name.as_member.db_no; 
} 

a_cache_name name() const 
{ 

return _name; 
} 

}; 

class DoAdjust { 
public: 

virtual a_uint do_adjust( CacheRef *ref ) = 0; 

}; 

unsigned CM_Clean( Database *db, unsigned rover, unsigned count ); 

#if !defined( DBTOOLS ) 

DBSRVAPI a_database_file *file_for_page( p_database db, a_page_id pg ); 
DBSRVAPI a_database_file *check_file_for_page( p_database db, a_page_id pg ); 
#endif 

static inline unsigned log2( ajDtrint n ) { 
unsigned I; 

for( I = 0; ((a_ptrint)1 « I) < n; ++I ); 
return( I ); 

} 

class Cachelnterface { 
public: 

Cachelnterface( struct an_engine_parms * ep ); 
virtual ~Cachelnterface(); 
virtual void *Alloclmage( Cachelnfo ** ) = 0; 
virtual void Freelmage( Cachelnfo * info ) = 0; 

virtual Cachelnfo * lnstall( a_database_file * f, a_page_id page_no, a_page_id real_page_no ) = 0; 

virtual void WaitAII( a_database_number db_no ) = 0; 

virtual void WaitForExtend( Pagelnfo * extend ) = 0; 

virtual void WaitUntilClean( IDatabaseFile * file ) = 0; 

virtual a_bool RemoveFromHash( Pagelnfo * info ) = 0; 

virtual Pagelnfo * LatchlflnCache( a_cache_name name ) = 0; 

virtual a_bool lslmmediatelyLatchable( a_cache_name name ) = 0; 

virtual a_bool lslOPending( a_cache_name name ) = 0; 

virtual void PrelO() = 0; 

virtual void PostlO() = 0; 

virtual void evict( Database *db, a J3age_id page_no ) = 0; 



virtual unsigned hint( Database *db, aj3age_id page_no ) = 0; 
#if IPRODUCTION 

virtual void check_for_locked _pages( int k ) = 0; 
#endif 

virtual a_ptrint cache_available_addr( void ) = 0; 

virtual a_ptrint ^virtual ^cache_max() = 0; 

virtual void flush_db_from_cache( p_database db, a_bool is_scrammed ) = 0; 
virtual void flush_mapped_pages( p_database db ) = 0; 

virtual void flush_cache_for_table_drop( p_database db, unsigned file_no ) = 0; 

virtual void flush( p_database db ) = 0; 

virtual void sa_flush_cache( p_database db ) = 0; 

virtual void adjust( DoAdjust *cb, Database *db, a_page_id p1, a jDageJd p2 = NULL_PAGE, a_page_id p3 = 
NULL_PAGE ) = 0; 
virtual unsigned hint( a_page_id page_no ) = 0; 

virtual void hintj3age_group( PageGroup *pagegrp, aj3age_id start_page, uint32 pages_wanted ) = 0; 
virtual void *multi_page_alloc( uint32 num_pages, uint32 page_size, MultiPageAlloc *handle ) = 0; 
virtual void multi_page_free( MultiPageAlloc *handle ) = 0; 
virtual void cache_message() = 0; 
virtual void engine_startup_complete() = 0; 
virtual void kick_auto_resize() = 0; 
virtual DynamicCacheConfig * min_config() = 0; 
virtual DynamicCacheConfig * max_config() = 0; 
virtual DynamicCacheConfig * current_config() = 0; 
virtual DynamicCacheConfig * initial_config() = 0; 
virtual a_bool resize_cache( uint64 newsize ) = 0; 
virtual an_image_set * get_images() = 0; 
unsigned page_bits_max() const { 
return( _db_page_bits_max ); 
} 

unsigned page_size_max() const { 
return( _db_page_size_max ); 

} 

a_ptrint page_mask_max() const { 
return( _db_page_mask_max ); 
} 

uint64 aligned_size( uint64 size ) const { 
return( _round_up_pow2( size, _alignment_amount ) ); 
} 

a_ptrint enough_to_fill_pages( double min_count, a_ptrint item_size ) const { 
return( (a jDtrint) (aligned_size( ((a_ptrint) min_count) * item_size )/item_size) ); 
} 

a_ptrint round_up_ordinal( a_ptrint ordinal ) const { 
return( _round_up_pow2( ordinal, _ordinal_alignment ) ); 
} 

a_ptrint round_down_ordinal( a_ptrint ordinal ) const { 
return( _round_down_pow2( ordinal, _ordinal_alignment ) ); 
} 

protected: 

friend class AWECache; 

unsigned const _db j)age_bits_max; 



unsigned const _clbj3age_size_max; 
a_ptrint const _db_page_mask_max; 
a_ptrint const _os_page_size; 
unsigned const _os_page_bits; 
a_ptrint const _alignment_amount; 
a_ptrint const _ordinal_alignment; 
public: 

virtual Cachelnfo *read_lock( p_database db, a_page_id page_no ) = 0; 

// 1 don't like referring to 'a_disk_page' at this level but it helps with type checking 

Cachelnfo *read_lock( p_database db, aj3age_id page_no, union a_disk_page **ppage ) 

{ 

Cachelnfo *info = read_lock( db, page_no ); 
*ppage = info->disk_page(); 
return( info ); 

} 

virtual Cachelnfo *write_lock( p_database db, a_page_id page_no ) = 0; 

Cachelnfo *write_lock( p_database db, a_page_id page_no, union a_disk J3age **ppage ) 

{ 

Cachelnfo *info = write_lock( db, page_no ); 
*ppage = info->disk_page(); 
return( info ); 

} 

virtual Cachelnfo *write_lock_clean( p_database db, a_page_id page_no ) = 0; 

Cachelnfo *write_lock_clean( p_database db, a_page_id page_no, union a_disk_page **ppage ) 

{ 

Cachelnfo *info = write_lock_clean( db, page_no ); 
*ppage = info->disk_page(); 
return( info ); 

} 

virtual Cachelnfo *writeJock_raw( p_database db, a_page_id page_no ) = 0; 

a_bool read_to_write_lock( Cachelnfo ** pinfo ) { 
Cachelnfo * info = *pinfo; 
if( read_to_write_lock( info ) ) { 

return( TRUE ); 

} 

a_pagejd page_no = info->page_no(); 
p_database db = info->file()->db; 
unlock( info ); 

*pinfo = write_lock( db, page_no ); 
return( FALSE ); 
} 

a_bool read_to_write_lock( Cachelnfo ** pinfo, union a_disk_page **ppage ) { 
if( read_to_write_lock( pinfo ) ) { 
return( TRUE ); 

} 

*ppage = (*pinfo)->disk_page(); 
return( FALSE ); 
} 

public: // PJB TODO: Eliminate these wrappers. 
a_bool read_to_write_lock( Cachelnfo *info ) { 



return info->reacl_to_write_lock(); 
} 

void write_to_reacl_lock( Cachelnfo *info ) { 
inf o->write_to_read_lock() ; 
} 

void mark_dirty( Cachelnfo *info ) { 
info->mark_dirty(); 
} 

void unlock( Cachelnfo *info ) { 
info->unlock(); 
} 

#if IPRODUCTION 

virtual void check_if_still_used_at_commit( p_database db, Cachelnfo *def_page ) = 0; 
#endif 

}; 

extern Cachelnterface *CM; 

class Auto I mage 

{ 

public: 

AutolmageO 

CM->Alloclmage( &_info ); 
-AutolmageO 

releaseQ; 
Cachelnfo *info() 

return( Jnfo ); 
void *image() 

return( (void *)_info->diskj3age() ); 
union a_disk_page *disk_page() 

return( _info->disk_page() ); 
void releaseO 

if( Jnfo 1= NULL ) { 
CM->Freelmage( Jnfo ); 
Jnfo = NULL; 

} 

} 

private: 

Cachelnfo *Jnfo; 

}; 

#endif 



